diff --git "a/wandb/run-20211106_211610-dtkf2u0m/files/output.log" "b/wandb/run-20211106_211610-dtkf2u0m/files/output.log" new file mode 100644--- /dev/null +++ "b/wandb/run-20211106_211610-dtkf2u0m/files/output.log" @@ -0,0 +1,3802 @@ +11/06/2021 21:16:12 - INFO - __main__ - Distributed environment: MULTI_GPU Backend: nccl +Num processes: 16 +Process index: 0 +Local process index: 0 +Device: cuda:0 +Use FP16 precision: True +/home/leandro/codeparrot-small/./ is already a clone of https://huggingface.co/lvwerra/codeparrot-small. Make sure you pull the latest changes with `repo.git_pull()`. +11/06/2021 21:16:13 - WARNING - huggingface_hub.repository - /home/leandro/codeparrot-small/./ is already a clone of https://huggingface.co/lvwerra/codeparrot-small. Make sure you pull the latest changes with `repo.git_pull()`. +Revision `proud-haze-135` does not exist. Created and checked out branch `proud-haze-135`. +11/06/2021 21:16:13 - WARNING - huggingface_hub.repository - Revision `proud-haze-135` does not exist. Created and checked out branch `proud-haze-135`. +11/06/2021 21:16:13 - WARNING - huggingface_hub.repository - +loading configuration file ./config.json +Model config GPT2Config { + "activation_function": "gelu_new", + "architectures": [ + "GPT2LMHeadModel" + ], + "attn_pdrop": 0.1, + "bos_token_id": 50256, + "embd_pdrop": 0.1, + "eos_token_id": 50256, + "initializer_range": 0.02, + "layer_norm_epsilon": 1e-05, + "model_type": "gpt2", + "n_ctx": 1024, + "n_embd": 768, + "n_head": 12, + "n_inner": null, + "n_layer": 12, + "n_positions": 1024, + "reorder_and_upcast_attn": true, + "resid_pdrop": 0.1, + "scale_attn_by_inverse_layer_idx": true, + "scale_attn_weights": true, + "summary_activation": null, + "summary_first_dropout": 0.1, + "summary_proj_to_labels": true, + "summary_type": "cls_index", + "summary_use_proj": true, + "task_specific_params": { + "text-generation": { + "do_sample": true, + "max_length": 50 + } + }, + "torch_dtype": "float32", + "transformers_version": "4.12.2", + "use_cache": true, + "vocab_size": 32768 +} +loading weights file ./pytorch_model.bin +All model checkpoint weights were used when initializing GPT2LMHeadModel. +All the weights of GPT2LMHeadModel were initialized from the model checkpoint at ./. +If your task is similar to the task the model of the checkpoint was trained on, you can already use GPT2LMHeadModel for predictions without further training. +Didn't find file ./added_tokens.json. We won't load it. +loading file ./vocab.json +loading file ./merges.txt +loading file ./tokenizer.json +loading file None +loading file ./special_tokens_map.json +loading file ./tokenizer_config.json +11/06/2021 21:16:15 - INFO - datasets.data_files - Some files matched the pattern '*' at /home/leandro/codeparrot-clean-train but don't have valid data file extensions: [PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/0b/f3/0bf3cd1320065c163f47a112458dc107650e3e862094b703b76073bd0b68663d'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/pre-rebase.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/fsmonitor-watchman.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/pre-applypatch.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/37/26/3726a0239b5cb7d0ef3ea36886c533d0becc7404217763015559edb546d53c94'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/e7/a9/e7a9ccbfe6bd92476f83eba205c47ed23732ace4c1bd7458d76d666ebbba3b1c'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/73/73/737327c2b47693e00050aa3410c5eb402c66211a79740ab57f1c763a1e557563'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/commit-msg.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/2a/7e/2a7e50bbdb90d6c4cec534c3f1dc7ec0e6a0dada15c07cfd94615940c632ce02'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/5a/5f/5a5fbc19e0e76787f668ada7235203c10b0cbcdea0ecf8f873f8ec281cfe3494'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/74/31/7431977a8e3a6eb0348b821009495f85d9373c1f730f4a74b0db43326568f77d'), PosixPath('/home/leandro/codeparrot-clean-train/.git/logs/refs/heads/main'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/50/38/503872def2ac44733fbefc2602ab16224caca0896aa1eba045025ef2d60efcdc'), PosixPath('/home/leandro/codeparrot-clean-train/.git/refs/heads/main'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/update.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/b6/ce/b6ce495492aedfc91b66efdfd214b2dfe44867c719d51590e1868e42f4e9b6dd'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/df/08/df0840d1657530c8fa9f82864be5999c515f54341d926c430a82528a6bb83740'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/2f/62/2f628d890bceee216f87edb3c45d2e384ee2501ce41a4c4169efaa3363bef1d2'), PosixPath('/home/leandro/codeparrot-clean-train/.git/HEAD'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/0f/7a/0f7a67cd83c1c069995f0f2510ebf818dcc71d9658f189de1231d2b7aac8883c'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/05/39/053944e1daead0b6de8e46ea2e0bc68b9247604c63a55d444ac3b9adb12e2cd2'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/dc/ac/dcacb03d8f43f7879c5eab4422644d7b3797b47dbb0c9c84d88cbc85822d8306'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/ac/e3/ace3ac440b380d604ab198cf8e838a2a375e7b0a6b5699ec74a8c79648f4bab8'), PosixPath('/home/leandro/codeparrot-clean-train/.git/description'), PosixPath('/home/leandro/codeparrot-clean-train/.git/refs/remotes/origin/HEAD'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/d4/9f/d49f1929644619c39cff677367ff2e18223a8046ec8f61e224954a10aa2ccf8f'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/2e/aa/2eaa21b832ed1496fb7f0b259666dbfc36ed483d81494d1e8705f9d601509c12'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/f1/a7/f1a7a250e1f6164a7fb602131ff54b69deb305258792f2358075403769d58fe5'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/d0/02/d0024828eece6d4d1c25cb4e539328be97fa28ce66a3b8d2374a117711cfd520'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/90/a5/90a573501de640c3e0e6f1b3508306febc96faf6061bb33c67894c168a1879c6'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/post-checkout'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/post-commit'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/5d/42/5d42ba9f195510757a3699005a7c43ddede4b598caf8a5f2f8c84d1125fa6324'), PosixPath('/home/leandro/codeparrot-clean-train/.git/logs/HEAD'), PosixPath('/home/leandro/codeparrot-clean-train/.git/packed-refs'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/5f/d1/5fd1bb56db810b65d1fd3866dc43d9c7b690c8f52b9ca8119b2a5f4c49d13eec'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/7c/0e/7c0ef87edb0e556939282c859c7c893a91b5b0f931394ca4cca4f4ec98a61951'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/ee/c1/eec1a9546aac0444a706c09f6aab67cd64403940657417e30212b7ff1e16665c'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/55/b6/55b6989a41ae296337356153e6081c61484d0b6734b6905683823e7317d01c42'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/pre-commit.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/cc/58/cc58b22515c4fd7d891287ee717c2054290b20c17b1c34693fd8964ab730687b'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/b6/8a/b68a74f9784402dcb311f4db72a873035e47b98b185a1813ab2c1645cb7255a2'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/fb/84/fb84ca8000808f62718994e4b44e79d88a05b345e9638d9f6cf6c8a5472da01f'), PosixPath('/home/leandro/codeparrot-clean-train/.git/objects/pack/pack-12438cb8112d3b4104fefcb88d751872b5e0fd6e.pack'), PosixPath('/home/leandro/codeparrot-clean-train/.git/info/exclude'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/12/8d/128d56e09d9d741b2778d733e595838a50a5e82fdc9adbb0aa8645457716b97e'), PosixPath('/home/leandro/codeparrot-clean-train/.git/objects/pack/pack-12438cb8112d3b4104fefcb88d751872b5e0fd6e.idx'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/b4/83/b4836655e350f0796acd2b1a206e657c2808d9f136afae095e0b94a790c704e1'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/3e/f2/3ef240d0b394384803ae1bbe3b30974e11eb9b1b6ad4f49afc2ed0f7c9eae0d6'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/14/08/14089cad26037080ee900bede2fd42d5cac70738b2e77402b36681e1d2a521f6'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/86/0e/860eda34e90456533e9dd41a5c0fdb74c54dc8d9cf43d6c60b887b2c858be831'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/post-update.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/pre-push'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/15/ac/15ac016e4cd702bb184457cbf5674d71b632fc34c29611ba4de549b85c67acfb'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/a4/6b/a46b5c08d39691524b46fadf78eab5efefa29978edfee799ec3587d928dc1302'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/fa/e6/fae6b44a24c1c35f15053a19a6b2b2af5cc9fb8bdaf0da409068a2a1f333f28e'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/17/5e/175e7375d6f65993071aa653bdd4e8b117cc02d1d2353cd7bcdbaaf7fe8b3c9c'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/ac/36/ac36d12d37c1dc8ee8d3b8f0eae93966ae73482ef725615bb1a715802ddd4dd4'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/17/96/1796f12729d0407cc57500c9c87959e0e7becd729f37374702868ed8765015f4'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/67/f1/67f1ff0d590fbf4aa9afa161c290fe9be17538d4b723278bb21fd6408b0e6a3e'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/55/c9/55c9c0b2f26de96e0311ee43e8eaa78ad1af387d0c59a26f22c5ebd507dda321'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/pre-push.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/config'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/9f/7e/9f7e18a3980d4b3d5ed9469ab7a2d67b608e8aa6fff38d876f86719c8f2a7a82'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/e6/48/e6484a578778beccab26c8549608ec13970e6bcdb9541cdccad20f4d984e8181'), PosixPath('/home/leandro/codeparrot-clean-train/.git/index'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/54/60/5460223b92bb118814a7777a939f4005b7426a7e4a068c193c10d1b86eeb862b'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/prepare-commit-msg.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/logs/refs/remotes/origin/HEAD'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/ae/45/ae45741df674456bc63bad91374d2ba5ef988d33d6e2a322ef0a5ac8af040371'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/60/41/604177fe5560efd99d93091fadab6293afe7cd7d12f81638c301de1c937c1583'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/ef/e1/efe1759837b74b5b5ed3df1a09d4c880f9ad20413d958f79d35bf1cb6a2a09d4'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/pre-receive.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/32/be/32beb30e381ff02fb71854b5534306f395ef00f51f02b62da1f027c8c7fab26f'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/9b/1b/9b1b8e52b9262f03f1719d3950dc8dfa2b9719dc2e273603023f6f329c1b2068'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/56/80/56803c607a19ccb576c90bdb10a02cfa7b3affc67dd150fa41b00cc22213b174'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/4e/39/4e392fcaae564652d234d07b4f71eeed90efe51b1b714831e39d77f3e537d3df'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/applypatch-msg.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/cd/33/cd339656799518495d23aedf1503459be6d3086e22672e80edab8403d12ded1c'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/f1/62/f162b06b5dca01aa85ef9a675d396c0fbab1d009b5bee1c5b7ea6b415c6f12a4'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/post-merge')] +Resolving data files: 100%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 53/53 [00:00<00:00, 196030.08it/s] +11/06/2021 21:16:15 - WARNING - datasets.builder - Using custom data configuration codeparrot-clean-train-e839c6c1585da466 +11/06/2021 21:16:15 - INFO - datasets.data_files - Some files matched the pattern '*' at /home/leandro/codeparrot-clean-valid but don't have valid data file extensions: [PosixPath('/home/leandro/codeparrot-clean-valid/.git/objects/60/0dc2964cf471fa4aac706659009777cf176497'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/commit-msg.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/refs/remotes/origin/HEAD'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/objects/95/7b2579c6ef20995a09efd9a17f8fd90606f5ed'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/pre-push.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/refs/heads/main'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/config'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/info/exclude'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/applypatch-msg.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/pre-commit.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/update.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/logs/refs/heads/main'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/HEAD'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/index'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/objects/25/747fcf966f2b7b3a2f4149130bff69ebe83718'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/objects/15/4f5f07c68026fb069c4bdfe3966893737035f4'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/objects/6d/d1188965fcd7feab0efc3506668a615805e13f'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/description'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/post-merge'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/prepare-commit-msg.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/objects/d9/cd7ad451bcd8a388471b341a961d0e6e6ff558'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/pre-rebase.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/objects/55/36bbd68dd8f283092b22eb77a051175c1b727a'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/lfs/objects/7f/8c/7f8c20a737c9084779bcdb853325ad4774d0db52c74aa2a63fd658d6787eb35b'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/fsmonitor-watchman.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/pre-applypatch.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/post-update.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/objects/09/e6a70d1aadc53ed29b9890332f184f89d0a39b'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/logs/refs/remotes/origin/HEAD'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/objects/5e/d5325308cb9a07b2c5807dad51120c9a75b6db'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/pre-push'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/post-checkout'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/post-commit'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/packed-refs'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/logs/HEAD'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/pre-receive.sample')] +11/06/2021 21:16:15 - WARNING - datasets.builder - Using custom data configuration codeparrot-clean-valid-ced470bd23403144 +Token indices sequence length is longer than the specified maximum sequence length for this model (1489 > 1024). Running this sequence through the model will result in indexing errors +11/06/2021 21:16:43 - INFO - __main__ - Step 1: {'lr': 0.0, 'samples': 192, 'steps': 0, 'loss/train': 10.55798625946045} +11/06/2021 21:16:43 - INFO - root - Reducer buckets have been rebuilt in this iteration. +11/06/2021 21:16:43 - INFO - __main__ - Step 2: {'lr': 2.5e-07, 'samples': 384, 'steps': 1, 'loss/train': 10.535750389099121} +11/06/2021 21:16:43 - INFO - __main__ - Step 3: {'lr': 5e-07, 'samples': 576, 'steps': 2, 'loss/train': 10.530282974243164} +11/06/2021 21:16:44 - INFO - __main__ - Step 4: {'lr': 7.5e-07, 'samples': 768, 'steps': 3, 'loss/train': 10.527787208557129} +11/06/2021 21:16:45 - INFO - __main__ - Step 5: {'lr': 1e-06, 'samples': 960, 'steps': 4, 'loss/train': 10.491048812866211} +11/06/2021 21:16:46 - INFO - __main__ - Step 6: {'lr': 1.25e-06, 'samples': 1152, 'steps': 5, 'loss/train': 10.409588813781738} +11/06/2021 21:16:46 - INFO - __main__ - Step 7: {'lr': 1.5e-06, 'samples': 1344, 'steps': 6, 'loss/train': 10.350728034973145} +11/06/2021 21:16:46 - INFO - __main__ - Step 8: {'lr': 1.75e-06, 'samples': 1536, 'steps': 7, 'loss/train': 10.252238273620605} +11/06/2021 21:16:47 - INFO - __main__ - Step 9: {'lr': 2e-06, 'samples': 1728, 'steps': 8, 'loss/train': 10.193534851074219} +11/06/2021 21:16:47 - INFO - __main__ - Step 10: {'lr': 2.25e-06, 'samples': 1920, 'steps': 9, 'loss/train': 9.953790664672852} +11/06/2021 21:16:48 - INFO - __main__ - Step 11: {'lr': 2.5e-06, 'samples': 2112, 'steps': 10, 'loss/train': 10.194929122924805} +11/06/2021 21:16:49 - INFO - __main__ - Step 12: {'lr': 2.75e-06, 'samples': 2304, 'steps': 11, 'loss/train': 9.89802074432373} +11/06/2021 21:16:49 - INFO - __main__ - Step 13: {'lr': 3e-06, 'samples': 2496, 'steps': 12, 'loss/train': 9.843729972839355} +11/06/2021 21:16:49 - INFO - __main__ - Step 14: {'lr': 3.25e-06, 'samples': 2688, 'steps': 13, 'loss/train': 9.845044136047363} +11/06/2021 21:16:50 - INFO - __main__ - Step 15: {'lr': 3.5e-06, 'samples': 2880, 'steps': 14, 'loss/train': 9.869210243225098} +11/06/2021 21:16:51 - INFO - __main__ - Step 16: {'lr': 3.75e-06, 'samples': 3072, 'steps': 15, 'loss/train': 9.587459564208984} +11/06/2021 21:16:51 - INFO - __main__ - Step 17: {'lr': 4e-06, 'samples': 3264, 'steps': 16, 'loss/train': 9.667202949523926} +11/06/2021 21:16:51 - INFO - __main__ - Step 18: {'lr': 4.250000000000001e-06, 'samples': 3456, 'steps': 17, 'loss/train': 9.495230674743652} +11/06/2021 21:16:52 - INFO - __main__ - Step 19: {'lr': 4.5e-06, 'samples': 3648, 'steps': 18, 'loss/train': 9.640376091003418} +11/06/2021 21:16:52 - INFO - __main__ - Step 20: {'lr': 4.75e-06, 'samples': 3840, 'steps': 19, 'loss/train': 9.428448677062988} +11/06/2021 21:16:52 - INFO - __main__ - Step 21: {'lr': 5e-06, 'samples': 4032, 'steps': 20, 'loss/train': 9.341026306152344} +11/06/2021 21:16:54 - INFO - __main__ - Step 22: {'lr': 5.2500000000000006e-06, 'samples': 4224, 'steps': 21, 'loss/train': 9.372577667236328} +11/06/2021 21:16:54 - INFO - __main__ - Step 23: {'lr': 5.5e-06, 'samples': 4416, 'steps': 22, 'loss/train': 8.967851638793945} +11/06/2021 21:16:54 - INFO - __main__ - Step 24: {'lr': 5.75e-06, 'samples': 4608, 'steps': 23, 'loss/train': 8.74506950378418} +11/06/2021 21:16:55 - INFO - __main__ - Step 25: {'lr': 6e-06, 'samples': 4800, 'steps': 24, 'loss/train': 9.786674499511719} +11/06/2021 21:16:55 - INFO - __main__ - Step 26: {'lr': 6.25e-06, 'samples': 4992, 'steps': 25, 'loss/train': 9.504456520080566} +11/06/2021 21:16:56 - INFO - __main__ - Step 27: {'lr': 6.5e-06, 'samples': 5184, 'steps': 26, 'loss/train': 9.166744232177734} +11/06/2021 21:16:56 - INFO - __main__ - Step 28: {'lr': 6.75e-06, 'samples': 5376, 'steps': 27, 'loss/train': 8.682860374450684} +11/06/2021 21:16:57 - INFO - __main__ - Step 29: {'lr': 7e-06, 'samples': 5568, 'steps': 28, 'loss/train': 8.596318244934082} +11/06/2021 21:16:57 - INFO - __main__ - Step 30: {'lr': 7.250000000000001e-06, 'samples': 5760, 'steps': 29, 'loss/train': 9.048979759216309} +11/06/2021 21:16:57 - INFO - __main__ - Step 31: {'lr': 7.5e-06, 'samples': 5952, 'steps': 30, 'loss/train': 9.320890426635742} +11/06/2021 21:16:58 - INFO - __main__ - Step 32: {'lr': 7.75e-06, 'samples': 6144, 'steps': 31, 'loss/train': 8.952228546142578} +11/06/2021 21:16:59 - INFO - __main__ - Step 33: {'lr': 8e-06, 'samples': 6336, 'steps': 32, 'loss/train': 8.751225471496582} +11/06/2021 21:16:59 - INFO - __main__ - Step 34: {'lr': 8.25e-06, 'samples': 6528, 'steps': 33, 'loss/train': 9.156981468200684} +11/06/2021 21:17:00 - INFO - __main__ - Step 35: {'lr': 8.500000000000002e-06, 'samples': 6720, 'steps': 34, 'loss/train': 8.837956428527832} +11/06/2021 21:17:00 - INFO - __main__ - Step 36: {'lr': 8.750000000000001e-06, 'samples': 6912, 'steps': 35, 'loss/train': 8.935142517089844} +11/06/2021 21:17:01 - INFO - __main__ - Step 37: {'lr': 9e-06, 'samples': 7104, 'steps': 36, 'loss/train': 9.019933700561523} +11/06/2021 21:17:02 - INFO - __main__ - Step 38: {'lr': 9.25e-06, 'samples': 7296, 'steps': 37, 'loss/train': 8.594483375549316} +11/06/2021 21:17:02 - INFO - __main__ - Step 39: {'lr': 9.5e-06, 'samples': 7488, 'steps': 38, 'loss/train': 9.565625190734863} +11/06/2021 21:17:02 - INFO - __main__ - Step 40: {'lr': 9.75e-06, 'samples': 7680, 'steps': 39, 'loss/train': 9.195219039916992} +11/06/2021 21:17:03 - INFO - __main__ - Step 41: {'lr': 1e-05, 'samples': 7872, 'steps': 40, 'loss/train': 9.008049011230469} +11/06/2021 21:17:04 - INFO - __main__ - Step 42: {'lr': 1.025e-05, 'samples': 8064, 'steps': 41, 'loss/train': 9.54212760925293} +11/06/2021 21:17:04 - INFO - __main__ - Step 43: {'lr': 1.0500000000000001e-05, 'samples': 8256, 'steps': 42, 'loss/train': 9.074606895446777} +11/06/2021 21:17:04 - INFO - __main__ - Step 44: {'lr': 1.0749999999999999e-05, 'samples': 8448, 'steps': 43, 'loss/train': 9.575305938720703} +11/06/2021 21:17:05 - INFO - __main__ - Step 45: {'lr': 1.1e-05, 'samples': 8640, 'steps': 44, 'loss/train': 9.862631797790527} +11/06/2021 21:17:05 - INFO - __main__ - Step 46: {'lr': 1.1249999999999999e-05, 'samples': 8832, 'steps': 45, 'loss/train': 8.833338737487793} +11/06/2021 21:17:06 - INFO - __main__ - Step 47: {'lr': 1.15e-05, 'samples': 9024, 'steps': 46, 'loss/train': 8.830769538879395} +11/06/2021 21:17:07 - INFO - __main__ - Step 48: {'lr': 1.1750000000000001e-05, 'samples': 9216, 'steps': 47, 'loss/train': 8.828520774841309} +11/06/2021 21:17:07 - INFO - __main__ - Step 49: {'lr': 1.2e-05, 'samples': 9408, 'steps': 48, 'loss/train': 8.692312240600586} +11/06/2021 21:17:07 - INFO - __main__ - Step 50: {'lr': 1.2250000000000001e-05, 'samples': 9600, 'steps': 49, 'loss/train': 8.698874473571777} +11/06/2021 21:17:08 - INFO - __main__ - Step 51: {'lr': 1.25e-05, 'samples': 9792, 'steps': 50, 'loss/train': 8.904641151428223} +11/06/2021 21:17:09 - INFO - __main__ - Step 52: {'lr': 1.275e-05, 'samples': 9984, 'steps': 51, 'loss/train': 8.66476821899414} +11/06/2021 21:17:09 - INFO - __main__ - Step 53: {'lr': 1.3e-05, 'samples': 10176, 'steps': 52, 'loss/train': 8.561541557312012} +11/06/2021 21:17:10 - INFO - __main__ - Step 54: {'lr': 1.325e-05, 'samples': 10368, 'steps': 53, 'loss/train': 8.71354866027832} +11/06/2021 21:17:10 - INFO - __main__ - Step 55: {'lr': 1.35e-05, 'samples': 10560, 'steps': 54, 'loss/train': 8.084650993347168} +11/06/2021 21:17:10 - INFO - __main__ - Step 56: {'lr': 1.375e-05, 'samples': 10752, 'steps': 55, 'loss/train': 8.701323509216309} +11/06/2021 21:17:11 - INFO - __main__ - Step 57: {'lr': 1.4e-05, 'samples': 10944, 'steps': 56, 'loss/train': 8.886054039001465} +11/06/2021 21:17:12 - INFO - __main__ - Step 58: {'lr': 1.425e-05, 'samples': 11136, 'steps': 57, 'loss/train': 8.962408065795898} +11/06/2021 21:17:12 - INFO - __main__ - Step 59: {'lr': 1.4500000000000002e-05, 'samples': 11328, 'steps': 58, 'loss/train': 8.731340408325195} +11/06/2021 21:17:13 - INFO - __main__ - Step 60: {'lr': 1.475e-05, 'samples': 11520, 'steps': 59, 'loss/train': 8.48225212097168} +11/06/2021 21:17:13 - INFO - __main__ - Step 61: {'lr': 1.5e-05, 'samples': 11712, 'steps': 60, 'loss/train': 8.860502243041992} +11/06/2021 21:17:14 - INFO - __main__ - Step 62: {'lr': 1.525e-05, 'samples': 11904, 'steps': 61, 'loss/train': 8.848859786987305} +11/06/2021 21:17:15 - INFO - __main__ - Step 63: {'lr': 1.55e-05, 'samples': 12096, 'steps': 62, 'loss/train': 8.20711612701416} +11/06/2021 21:17:15 - INFO - __main__ - Step 64: {'lr': 1.575e-05, 'samples': 12288, 'steps': 63, 'loss/train': 10.296394348144531} +11/06/2021 21:17:15 - INFO - __main__ - Step 65: {'lr': 1.6e-05, 'samples': 12480, 'steps': 64, 'loss/train': 7.71311092376709} +11/06/2021 21:17:16 - INFO - __main__ - Step 66: {'lr': 1.6250000000000002e-05, 'samples': 12672, 'steps': 65, 'loss/train': 8.466562271118164} +11/06/2021 21:17:16 - INFO - __main__ - Step 67: {'lr': 1.65e-05, 'samples': 12864, 'steps': 66, 'loss/train': 8.35257339477539} +11/06/2021 21:17:17 - INFO - __main__ - Step 68: {'lr': 1.675e-05, 'samples': 13056, 'steps': 67, 'loss/train': 8.386396408081055} +11/06/2021 21:17:18 - INFO - __main__ - Step 69: {'lr': 1.7000000000000003e-05, 'samples': 13248, 'steps': 68, 'loss/train': 8.12002944946289} +11/06/2021 21:17:18 - INFO - __main__ - Step 70: {'lr': 1.7250000000000003e-05, 'samples': 13440, 'steps': 69, 'loss/train': 8.70462417602539} +11/06/2021 21:17:18 - INFO - __main__ - Step 71: {'lr': 1.7500000000000002e-05, 'samples': 13632, 'steps': 70, 'loss/train': 8.239697456359863} +11/06/2021 21:17:19 - INFO - __main__ - Step 72: {'lr': 1.7749999999999998e-05, 'samples': 13824, 'steps': 71, 'loss/train': 7.610179424285889} +11/06/2021 21:17:20 - INFO - __main__ - Step 73: {'lr': 1.8e-05, 'samples': 14016, 'steps': 72, 'loss/train': 7.8869452476501465} +11/06/2021 21:17:20 - INFO - __main__ - Step 74: {'lr': 1.825e-05, 'samples': 14208, 'steps': 73, 'loss/train': 7.692283630371094} +11/06/2021 21:17:21 - INFO - __main__ - Step 75: {'lr': 1.85e-05, 'samples': 14400, 'steps': 74, 'loss/train': 8.208292007446289} +11/06/2021 21:17:21 - INFO - __main__ - Step 76: {'lr': 1.875e-05, 'samples': 14592, 'steps': 75, 'loss/train': 7.97852897644043} +11/06/2021 21:17:21 - INFO - __main__ - Step 77: {'lr': 1.9e-05, 'samples': 14784, 'steps': 76, 'loss/train': 8.777739524841309} +11/06/2021 21:17:22 - INFO - __main__ - Step 78: {'lr': 1.925e-05, 'samples': 14976, 'steps': 77, 'loss/train': 7.68981409072876} +11/06/2021 21:17:23 - INFO - __main__ - Step 79: {'lr': 1.95e-05, 'samples': 15168, 'steps': 78, 'loss/train': 7.656458854675293} +11/06/2021 21:17:23 - INFO - __main__ - Step 80: {'lr': 1.975e-05, 'samples': 15360, 'steps': 79, 'loss/train': 8.30695915222168} +11/06/2021 21:17:23 - INFO - __main__ - Step 81: {'lr': 2e-05, 'samples': 15552, 'steps': 80, 'loss/train': 7.897383689880371} +11/06/2021 21:17:25 - INFO - __main__ - Step 83: {'lr': 2.05e-05, 'samples': 15936, 'steps': 82, 'loss/train': 8.247127532958984} +11/06/2021 21:17:25 - INFO - __main__ - Step 84: {'lr': 2.0750000000000003e-05, 'samples': 16128, 'steps': 83, 'loss/train': 8.18776798248291} +11/06/2021 21:17:25 - INFO - __main__ - Step 85: {'lr': 2.1000000000000002e-05, 'samples': 16320, 'steps': 84, 'loss/train': 7.7213358879089355} +11/06/2021 21:17:26 - INFO - __main__ - Step 86: {'lr': 2.125e-05, 'samples': 16512, 'steps': 85, 'loss/train': 7.880347728729248} +11/06/2021 21:17:27 - INFO - __main__ - Step 88: {'lr': 2.175e-05, 'samples': 16896, 'steps': 87, 'loss/train': 7.1267242431640625} +11/06/2021 21:17:27 - INFO - __main__ - Step 89: {'lr': 2.2e-05, 'samples': 17088, 'steps': 88, 'loss/train': 7.992337703704834} +11/06/2021 21:17:29 - INFO - __main__ - Step 92: {'lr': 2.275e-05, 'samples': 17664, 'steps': 91, 'loss/train': 7.861474990844727}650268554688} +11/06/2021 21:17:29 - INFO - __main__ - Step 93: {'lr': 2.3e-05, 'samples': 17856, 'steps': 92, 'loss/train': 7.493942737579346} +11/06/2021 21:17:31 - INFO - __main__ - Step 98: {'lr': 2.425e-05, 'samples': 18816, 'steps': 97, 'loss/train': 7.735995292663574}650268554688} +11/06/2021 21:17:31 - INFO - __main__ - Step 98: {'lr': 2.425e-05, 'samples': 18816, 'steps': 97, 'loss/train': 7.735995292663574}650268554688} +11/06/2021 21:17:35 - INFO - __main__ - Step 104: {'lr': 2.575e-05, 'samples': 19968, 'steps': 103, 'loss/train': 7.325517654418945}0268554688} +11/06/2021 21:17:38 - INFO - __main__ - Step 110: {'lr': 2.725e-05, 'samples': 21120, 'steps': 109, 'loss/train': 8.008770942687988}0268554688} +11/06/2021 21:17:38 - INFO - __main__ - Step 110: {'lr': 2.725e-05, 'samples': 21120, 'steps': 109, 'loss/train': 8.008770942687988}0268554688} +11/06/2021 21:17:41 - INFO - __main__ - Step 116: {'lr': 2.875e-05, 'samples': 22272, 'steps': 115, 'loss/train': 7.741561412811279}0268554688} +11/06/2021 21:17:43 - INFO - __main__ - Step 122: {'lr': 3.025e-05, 'samples': 23424, 'steps': 121, 'loss/train': 6.9648213386535645}268554688} +11/06/2021 21:17:43 - INFO - __main__ - Step 122: {'lr': 3.025e-05, 'samples': 23424, 'steps': 121, 'loss/train': 6.9648213386535645}268554688} +11/06/2021 21:17:47 - INFO - __main__ - Step 128: {'lr': 3.175e-05, 'samples': 24576, 'steps': 127, 'loss/train': 7.172966003417969}}268554688} +11/06/2021 21:17:49 - INFO - __main__ - Step 134: {'lr': 3.325e-05, 'samples': 25728, 'steps': 133, 'loss/train': 7.035802841186523}}268554688} +11/06/2021 21:17:49 - INFO - __main__ - Step 134: {'lr': 3.325e-05, 'samples': 25728, 'steps': 133, 'loss/train': 7.035802841186523}}268554688} +11/06/2021 21:17:53 - INFO - __main__ - Step 140: {'lr': 3.4750000000000004e-05, 'samples': 26880, 'steps': 139, 'loss/train': 6.972182273864746} +11/06/2021 21:17:56 - INFO - __main__ - Step 146: {'lr': 3.625e-05, 'samples': 28032, 'steps': 145, 'loss/train': 7.03615140914917}2182273864746} +11/06/2021 21:17:56 - INFO - __main__ - Step 146: {'lr': 3.625e-05, 'samples': 28032, 'steps': 145, 'loss/train': 7.03615140914917}2182273864746} +11/06/2021 21:17:59 - INFO - __main__ - Step 152: {'lr': 3.775e-05, 'samples': 29184, 'steps': 151, 'loss/train': 6.523715019226074}182273864746} +11/06/2021 21:18:01 - INFO - __main__ - Step 158: {'lr': 3.925e-05, 'samples': 30336, 'steps': 157, 'loss/train': 6.675495624542236}182273864746} +11/06/2021 21:18:04 - INFO - __main__ - Step 164: {'lr': 4.075e-05, 'samples': 31488, 'steps': 163, 'loss/train': 6.836953163146973}182273864746} +11/06/2021 21:18:04 - INFO - __main__ - Step 164: {'lr': 4.075e-05, 'samples': 31488, 'steps': 163, 'loss/train': 6.836953163146973}182273864746} +11/06/2021 21:18:08 - INFO - __main__ - Step 170: {'lr': 4.2250000000000004e-05, 'samples': 32640, 'steps': 169, 'loss/train': 7.073266506195068} +11/06/2021 21:18:08 - INFO - __main__ - Step 170: {'lr': 4.2250000000000004e-05, 'samples': 32640, 'steps': 169, 'loss/train': 7.073266506195068} +11/06/2021 21:18:11 - INFO - __main__ - Step 176: {'lr': 4.375e-05, 'samples': 33792, 'steps': 175, 'loss/train': 7.043330192565918}266506195068} +11/06/2021 21:18:13 - INFO - __main__ - Step 182: {'lr': 4.525e-05, 'samples': 34944, 'steps': 181, 'loss/train': 6.373216152191162}266506195068} +11/06/2021 21:18:13 - INFO - __main__ - Step 182: {'lr': 4.525e-05, 'samples': 34944, 'steps': 181, 'loss/train': 6.373216152191162}266506195068} +11/06/2021 21:18:16 - INFO - __main__ - Step 188: {'lr': 4.675e-05, 'samples': 36096, 'steps': 187, 'loss/train': 5.526083469390869}266506195068} +11/06/2021 21:18:19 - INFO - __main__ - Step 194: {'lr': 4.825e-05, 'samples': 37248, 'steps': 193, 'loss/train': 6.355683326721191}266506195068} +11/06/2021 21:18:22 - INFO - __main__ - Step 200: {'lr': 4.975e-05, 'samples': 38400, 'steps': 199, 'loss/train': 6.113000392913818}266506195068} +11/06/2021 21:18:22 - INFO - __main__ - Step 200: {'lr': 4.975e-05, 'samples': 38400, 'steps': 199, 'loss/train': 6.113000392913818}266506195068} +11/06/2021 21:18:25 - INFO - __main__ - Step 206: {'lr': 5.125e-05, 'samples': 39552, 'steps': 205, 'loss/train': 5.817543029785156}266506195068} +11/06/2021 21:18:28 - INFO - __main__ - Step 212: {'lr': 5.275e-05, 'samples': 40704, 'steps': 211, 'loss/train': 5.677988529205322}266506195068} +11/06/2021 21:18:28 - INFO - __main__ - Step 212: {'lr': 5.275e-05, 'samples': 40704, 'steps': 211, 'loss/train': 5.677988529205322}266506195068} +11/06/2021 21:18:31 - INFO - __main__ - Step 218: {'lr': 5.4250000000000004e-05, 'samples': 41856, 'steps': 217, 'loss/train': 6.029814720153809} +11/06/2021 21:18:34 - INFO - __main__ - Step 224: {'lr': 5.575e-05, 'samples': 43008, 'steps': 223, 'loss/train': 6.467023849487305}814720153809} +11/06/2021 21:18:34 - INFO - __main__ - Step 224: {'lr': 5.575e-05, 'samples': 43008, 'steps': 223, 'loss/train': 6.467023849487305}814720153809} +11/06/2021 21:18:37 - INFO - __main__ - Step 230: {'lr': 5.725e-05, 'samples': 44160, 'steps': 229, 'loss/train': 5.728048324584961}814720153809} +11/06/2021 21:18:39 - INFO - __main__ - Step 236: {'lr': 5.875e-05, 'samples': 45312, 'steps': 235, 'loss/train': 6.2582688331604}1}814720153809} +11/06/2021 21:18:42 - INFO - __main__ - Step 242: {'lr': 6.025e-05, 'samples': 46464, 'steps': 241, 'loss/train': 6.203149318695068}814720153809} +11/06/2021 21:18:42 - INFO - __main__ - Step 242: {'lr': 6.025e-05, 'samples': 46464, 'steps': 241, 'loss/train': 6.203149318695068}814720153809} +11/06/2021 21:18:45 - INFO - __main__ - Step 248: {'lr': 6.175e-05, 'samples': 47616, 'steps': 247, 'loss/train': 5.754123210906982}814720153809} +11/06/2021 21:18:45 - INFO - __main__ - Step 248: {'lr': 6.175e-05, 'samples': 47616, 'steps': 247, 'loss/train': 5.754123210906982}814720153809} +11/06/2021 21:18:49 - INFO - __main__ - Step 254: {'lr': 6.325e-05, 'samples': 48768, 'steps': 253, 'loss/train': 5.7925004959106445}14720153809} +11/06/2021 21:18:52 - INFO - __main__ - Step 260: {'lr': 6.475e-05, 'samples': 49920, 'steps': 259, 'loss/train': 3.9729881286621094}14720153809} +11/06/2021 21:18:55 - INFO - __main__ - Step 266: {'lr': 6.625000000000001e-05, 'samples': 51072, 'steps': 265, 'loss/train': 6.112322807312012}} +11/06/2021 21:18:55 - INFO - __main__ - Step 266: {'lr': 6.625000000000001e-05, 'samples': 51072, 'steps': 265, 'loss/train': 6.112322807312012}} +11/06/2021 21:18:57 - INFO - __main__ - Step 272: {'lr': 6.775000000000001e-05, 'samples': 52224, 'steps': 271, 'loss/train': 5.43068790435791}}} +11/06/2021 21:19:00 - INFO - __main__ - Step 278: {'lr': 6.925e-05, 'samples': 53376, 'steps': 277, 'loss/train': 5.7302045822143555}790435791}}} +11/06/2021 21:19:00 - INFO - __main__ - Step 278: {'lr': 6.925e-05, 'samples': 53376, 'steps': 277, 'loss/train': 5.7302045822143555}790435791}}} +11/06/2021 21:19:03 - INFO - __main__ - Step 284: {'lr': 7.075e-05, 'samples': 54528, 'steps': 283, 'loss/train': 5.200248718261719}}790435791}}} +11/06/2021 21:19:06 - INFO - __main__ - Step 290: {'lr': 7.225e-05, 'samples': 55680, 'steps': 289, 'loss/train': 6.18521785736084}}}790435791}}} +11/06/2021 21:19:06 - INFO - __main__ - Step 290: {'lr': 7.225e-05, 'samples': 55680, 'steps': 289, 'loss/train': 6.18521785736084}}}790435791}}} +11/06/2021 21:19:09 - INFO - __main__ - Step 296: {'lr': 7.375e-05, 'samples': 56832, 'steps': 295, 'loss/train': 5.397673606872559}}790435791}}} +11/06/2021 21:19:12 - INFO - __main__ - Step 302: {'lr': 7.525e-05, 'samples': 57984, 'steps': 301, 'loss/train': 5.377347469329834}}790435791}}} +11/06/2021 21:19:15 - INFO - __main__ - Step 307: {'lr': 7.65e-05, 'samples': 58944, 'steps': 306, 'loss/train': 5.420361518859863}}}790435791}}} +11/06/2021 21:19:15 - INFO - __main__ - Step 307: {'lr': 7.65e-05, 'samples': 58944, 'steps': 306, 'loss/train': 5.420361518859863}}}790435791}}} +11/06/2021 21:19:18 - INFO - __main__ - Step 314: {'lr': 7.825e-05, 'samples': 60288, 'steps': 313, 'loss/train': 5.498117923736572}}790435791}}} +11/06/2021 21:19:21 - INFO - __main__ - Step 320: {'lr': 7.975e-05, 'samples': 61440, 'steps': 319, 'loss/train': 5.5839314460754395}790435791}}} +11/06/2021 21:19:21 - INFO - __main__ - Step 320: {'lr': 7.975e-05, 'samples': 61440, 'steps': 319, 'loss/train': 5.5839314460754395}790435791}}} +11/06/2021 21:19:24 - INFO - __main__ - Step 327: {'lr': 8.15e-05, 'samples': 62784, 'steps': 326, 'loss/train': 5.665132522583008}5}790435791}}} +11/06/2021 21:19:26 - INFO - __main__ - Step 331: {'lr': 8.25e-05, 'samples': 63552, 'steps': 330, 'loss/train': 5.495372295379639}5}790435791}}} +11/06/2021 21:19:28 - INFO - __main__ - Step 335: {'lr': 8.350000000000001e-05, 'samples': 64320, 'steps': 334, 'loss/train': 5.6893181800842285} +11/06/2021 21:19:30 - INFO - __main__ - Step 340: {'lr': 8.475000000000001e-05, 'samples': 65280, 'steps': 339, 'loss/train': 5.477786540985107}} +11/06/2021 21:19:33 - INFO - __main__ - Step 344: {'lr': 8.575000000000001e-05, 'samples': 66048, 'steps': 343, 'loss/train': 5.646244525909424}} +11/06/2021 21:19:35 - INFO - __main__ - Step 348: {'lr': 8.675e-05, 'samples': 66816, 'steps': 347, 'loss/train': 5.6107988357543945}4525909424}} +11/06/2021 21:19:36 - INFO - __main__ - Step 352: {'lr': 8.774999999999999e-05, 'samples': 67584, 'steps': 351, 'loss/train': 6.211921215057373}} +11/06/2021 21:19:38 - INFO - __main__ - Step 356: {'lr': 8.875e-05, 'samples': 68352, 'steps': 355, 'loss/train': 5.443009853363037}21215057373}} +11/06/2021 21:19:41 - INFO - __main__ - Step 361: {'lr': 8.999999999999999e-05, 'samples': 69312, 'steps': 360, 'loss/train': 7.289037227630615}} +11/06/2021 21:19:43 - INFO - __main__ - Step 365: {'lr': 9.1e-05, 'samples': 70080, 'steps': 364, 'loss/train': 5.4572978019714355}037227630615}} +11/06/2021 21:19:45 - INFO - __main__ - Step 369: {'lr': 9.2e-05, 'samples': 70848, 'steps': 368, 'loss/train': 5.474288463592529}}037227630615}} +11/06/2021 21:19:46 - INFO - __main__ - Step 373: {'lr': 9.3e-05, 'samples': 71616, 'steps': 372, 'loss/train': 5.273648262023926}}037227630615}} +11/06/2021 21:19:48 - INFO - __main__ - Step 377: {'lr': 9.400000000000001e-05, 'samples': 72384, 'steps': 376, 'loss/train': 5.5180864334106445} +11/06/2021 21:19:51 - INFO - __main__ - Step 382: {'lr': 9.525e-05, 'samples': 73344, 'steps': 381, 'loss/train': 5.458894729614258}864334106445} +11/06/2021 21:19:51 - INFO - __main__ - Step 382: {'lr': 9.525e-05, 'samples': 73344, 'steps': 381, 'loss/train': 5.458894729614258}864334106445} +11/06/2021 21:19:55 - INFO - __main__ - Step 389: {'lr': 9.7e-05, 'samples': 74688, 'steps': 388, 'loss/train': 5.781015396118164}8}864334106445} +11/06/2021 21:19:56 - INFO - __main__ - Step 393: {'lr': 9.800000000000001e-05, 'samples': 75456, 'steps': 392, 'loss/train': 5.350080966949463}} +11/06/2021 21:19:58 - INFO - __main__ - Step 397: {'lr': 9.900000000000001e-05, 'samples': 76224, 'steps': 396, 'loss/train': 5.724830150604248}} +11/06/2021 21:20:01 - INFO - __main__ - Step 402: {'lr': 0.00010025000000000001, 'samples': 77184, 'steps': 401, 'loss/train': 5.318662166595459} +11/06/2021 21:20:03 - INFO - __main__ - Step 406: {'lr': 0.00010125000000000001, 'samples': 77952, 'steps': 405, 'loss/train': 5.227279186248779} +11/06/2021 21:20:05 - INFO - __main__ - Step 410: {'lr': 0.00010224999999999999, 'samples': 78720, 'steps': 409, 'loss/train': 5.491655349731445} +11/06/2021 21:20:06 - INFO - __main__ - Step 414: {'lr': 0.00010325, 'samples': 79488, 'steps': 413, 'loss/train': 5.201007843017578}55349731445} +11/06/2021 21:20:08 - INFO - __main__ - Step 418: {'lr': 0.00010425, 'samples': 80256, 'steps': 417, 'loss/train': 5.490600109100342}55349731445} +11/06/2021 21:20:11 - INFO - __main__ - Step 423: {'lr': 0.0001055, 'samples': 81216, 'steps': 422, 'loss/train': 5.291647434234619}}55349731445} +11/06/2021 21:20:13 - INFO - __main__ - Step 427: {'lr': 0.0001065, 'samples': 81984, 'steps': 426, 'loss/train': 5.437173366546631}}55349731445} +11/06/2021 21:20:15 - INFO - __main__ - Step 431: {'lr': 0.0001075, 'samples': 82752, 'steps': 430, 'loss/train': 4.334190845489502}}55349731445} +11/06/2021 21:20:16 - INFO - __main__ - Step 435: {'lr': 0.00010850000000000001, 'samples': 83520, 'steps': 434, 'loss/train': 5.3725810050964355} +11/06/2021 21:20:18 - INFO - __main__ - Step 439: {'lr': 0.0001095, 'samples': 84288, 'steps': 438, 'loss/train': 5.41857385635376}25810050964355} +11/06/2021 21:20:18 - INFO - __main__ - Step 439: {'lr': 0.0001095, 'samples': 84288, 'steps': 438, 'loss/train': 5.41857385635376}25810050964355} +11/06/2021 21:20:23 - INFO - __main__ - Step 447: {'lr': 0.0001115, 'samples': 85824, 'steps': 446, 'loss/train': 5.4635491371154785}810050964355} +11/06/2021 21:20:25 - INFO - __main__ - Step 451: {'lr': 0.00011250000000000001, 'samples': 86592, 'steps': 450, 'loss/train': 4.955085754394531}} +11/06/2021 21:20:26 - INFO - __main__ - Step 455: {'lr': 0.00011350000000000001, 'samples': 87360, 'steps': 454, 'loss/train': 4.927133083343506}} +11/06/2021 21:20:29 - INFO - __main__ - Step 459: {'lr': 0.0001145, 'samples': 88128, 'steps': 458, 'loss/train': 6.301289081573486}133083343506}} +11/06/2021 21:20:31 - INFO - __main__ - Step 464: {'lr': 0.00011575000000000001, 'samples': 89088, 'steps': 463, 'loss/train': 4.844412326812744}} +11/06/2021 21:20:33 - INFO - __main__ - Step 468: {'lr': 0.00011675, 'samples': 89856, 'steps': 467, 'loss/train': 5.613701820373535}12326812744}} +11/06/2021 21:20:33 - INFO - __main__ - Step 468: {'lr': 0.00011675, 'samples': 89856, 'steps': 467, 'loss/train': 5.613701820373535}12326812744}} +11/06/2021 21:20:36 - INFO - __main__ - Step 475: {'lr': 0.0001185, 'samples': 91200, 'steps': 474, 'loss/train': 5.4914021492004395}12326812744}} +11/06/2021 21:20:39 - INFO - __main__ - Step 480: {'lr': 0.00011975, 'samples': 92160, 'steps': 479, 'loss/train': 5.236664295196533}12326812744}} +11/06/2021 21:20:39 - INFO - __main__ - Step 480: {'lr': 0.00011975, 'samples': 92160, 'steps': 479, 'loss/train': 5.236664295196533}12326812744}} +11/06/2021 21:20:43 - INFO - __main__ - Step 488: {'lr': 0.00012175, 'samples': 93696, 'steps': 487, 'loss/train': 5.1655683517456055}2326812744}} +11/06/2021 21:20:45 - INFO - __main__ - Step 492: {'lr': 0.00012275, 'samples': 94464, 'steps': 491, 'loss/train': 5.145169734954834}}2326812744}} +11/06/2021 21:20:47 - INFO - __main__ - Step 496: {'lr': 0.00012375, 'samples': 95232, 'steps': 495, 'loss/train': 4.821667194366455}}2326812744}} +11/06/2021 21:20:49 - INFO - __main__ - Step 501: {'lr': 0.000125, 'samples': 96192, 'steps': 500, 'loss/train': 5.50537109375}66455}}2326812744}} +11/06/2021 21:20:51 - INFO - __main__ - Step 505: {'lr': 0.000126, 'samples': 96960, 'steps': 504, 'loss/train': 5.220231056213379}5}}2326812744}} +11/06/2021 21:20:51 - INFO - __main__ - Step 505: {'lr': 0.000126, 'samples': 96960, 'steps': 504, 'loss/train': 5.220231056213379}5}}2326812744}} +11/06/2021 21:20:55 - INFO - __main__ - Step 512: {'lr': 0.00012775000000000002, 'samples': 98304, 'steps': 511, 'loss/train': 5.125716686248779}} +11/06/2021 21:20:57 - INFO - __main__ - Step 516: {'lr': 0.00012875, 'samples': 99072, 'steps': 515, 'loss/train': 5.111538410186768}16686248779}} +11/06/2021 21:20:59 - INFO - __main__ - Step 520: {'lr': 0.00012975, 'samples': 99840, 'steps': 519, 'loss/train': 4.82402229309082}}16686248779}} +11/06/2021 21:20:59 - INFO - __main__ - Step 520: {'lr': 0.00012975, 'samples': 99840, 'steps': 519, 'loss/train': 4.82402229309082}}16686248779}} +11/06/2021 21:21:03 - INFO - __main__ - Step 527: {'lr': 0.0001315, 'samples': 101184, 'steps': 526, 'loss/train': 5.979576587677002}16686248779}} +11/06/2021 21:21:05 - INFO - __main__ - Step 531: {'lr': 0.00013250000000000002, 'samples': 101952, 'steps': 530, 'loss/train': 4.945707321166992} +11/06/2021 21:21:05 - INFO - __main__ - Step 531: {'lr': 0.00013250000000000002, 'samples': 101952, 'steps': 530, 'loss/train': 4.945707321166992} +11/06/2021 21:21:05 - INFO - __main__ - Step 531: {'lr': 0.00013250000000000002, 'samples': 101952, 'steps': 530, 'loss/train': 4.945707321166992} +11/06/2021 21:21:10 - INFO - __main__ - Step 542: {'lr': 0.00013525, 'samples': 104064, 'steps': 541, 'loss/train': 6.563281059265137}07321166992} +11/06/2021 21:21:13 - INFO - __main__ - Step 547: {'lr': 0.0001365, 'samples': 105024, 'steps': 546, 'loss/train': 5.063644886016846}}07321166992} +11/06/2021 21:21:15 - INFO - __main__ - Step 551: {'lr': 0.0001375, 'samples': 105792, 'steps': 550, 'loss/train': 5.3217949867248535}07321166992} +11/06/2021 21:21:17 - INFO - __main__ - Step 555: {'lr': 0.0001385, 'samples': 106560, 'steps': 554, 'loss/train': 1.4391024112701416}07321166992} +11/06/2021 21:21:18 - INFO - __main__ - Step 559: {'lr': 0.0001395, 'samples': 107328, 'steps': 558, 'loss/train': 5.34543514251709}6}07321166992} +11/06/2021 21:21:20 - INFO - __main__ - Step 563: {'lr': 0.00014050000000000003, 'samples': 108096, 'steps': 562, 'loss/train': 5.075902462005615} +11/06/2021 21:21:23 - INFO - __main__ - Step 568: {'lr': 0.00014175, 'samples': 109056, 'steps': 567, 'loss/train': 5.004296779632568}02462005615} +11/06/2021 21:21:23 - INFO - __main__ - Step 568: {'lr': 0.00014175, 'samples': 109056, 'steps': 567, 'loss/train': 5.004296779632568}02462005615} +11/06/2021 21:21:23 - INFO - __main__ - Step 568: {'lr': 0.00014175, 'samples': 109056, 'steps': 567, 'loss/train': 5.004296779632568}02462005615} +11/06/2021 21:21:28 - INFO - __main__ - Step 578: {'lr': 0.00014424999999999998, 'samples': 110976, 'steps': 577, 'loss/train': 4.281363487243652} +11/06/2021 21:21:31 - INFO - __main__ - Step 583: {'lr': 0.00014549999999999999, 'samples': 111936, 'steps': 582, 'loss/train': 5.447309970855713} +11/06/2021 21:21:31 - INFO - __main__ - Step 583: {'lr': 0.00014549999999999999, 'samples': 111936, 'steps': 582, 'loss/train': 5.447309970855713} +11/06/2021 21:21:35 - INFO - __main__ - Step 591: {'lr': 0.0001475, 'samples': 113472, 'steps': 590, 'loss/train': 5.016930103302002}309970855713} +11/06/2021 21:21:36 - INFO - __main__ - Step 595: {'lr': 0.0001485, 'samples': 114240, 'steps': 594, 'loss/train': 4.915690898895264}309970855713} +11/06/2021 21:21:38 - INFO - __main__ - Step 599: {'lr': 0.0001495, 'samples': 115008, 'steps': 598, 'loss/train': 4.568467140197754}309970855713} +11/06/2021 21:21:38 - INFO - __main__ - Step 599: {'lr': 0.0001495, 'samples': 115008, 'steps': 598, 'loss/train': 4.568467140197754}309970855713} +11/06/2021 21:21:38 - INFO - __main__ - Step 599: {'lr': 0.0001495, 'samples': 115008, 'steps': 598, 'loss/train': 4.568467140197754}309970855713} +11/06/2021 21:21:44 - INFO - __main__ - Step 610: {'lr': 0.00015225, 'samples': 117120, 'steps': 609, 'loss/train': 4.78218412399292}309970855713} +11/06/2021 21:21:47 - INFO - __main__ - Step 615: {'lr': 0.0001535, 'samples': 118080, 'steps': 614, 'loss/train': 5.002647876739502}309970855713} +11/06/2021 21:21:49 - INFO - __main__ - Step 619: {'lr': 0.00015450000000000001, 'samples': 118848, 'steps': 618, 'loss/train': 4.601840019226074} +11/06/2021 21:21:51 - INFO - __main__ - Step 623: {'lr': 0.0001555, 'samples': 119616, 'steps': 622, 'loss/train': 4.604945182800293}840019226074} +11/06/2021 21:21:52 - INFO - __main__ - Step 627: {'lr': 0.0001565, 'samples': 120384, 'steps': 626, 'loss/train': 4.22480583190918}}840019226074} +11/06/2021 21:21:55 - INFO - __main__ - Step 631: {'lr': 0.0001575, 'samples': 121152, 'steps': 630, 'loss/train': 4.3496575355529785}40019226074} +11/06/2021 21:21:57 - INFO - __main__ - Step 636: {'lr': 0.00015875, 'samples': 122112, 'steps': 635, 'loss/train': 5.596816062927246}40019226074} +11/06/2021 21:21:59 - INFO - __main__ - Step 640: {'lr': 0.00015975, 'samples': 122880, 'steps': 639, 'loss/train': 5.002859115600586}40019226074} +11/06/2021 21:21:59 - INFO - __main__ - Step 640: {'lr': 0.00015975, 'samples': 122880, 'steps': 639, 'loss/train': 5.002859115600586}40019226074} +11/06/2021 21:22:02 - INFO - __main__ - Step 647: {'lr': 0.0001615, 'samples': 124224, 'steps': 646, 'loss/train': 4.445610046386719}}40019226074} +11/06/2021 21:22:04 - INFO - __main__ - Step 651: {'lr': 0.00016250000000000002, 'samples': 124992, 'steps': 650, 'loss/train': 4.449684143066406} +11/06/2021 21:22:07 - INFO - __main__ - Step 656: {'lr': 0.00016375000000000002, 'samples': 125952, 'steps': 655, 'loss/train': 4.627468109130859} +11/06/2021 21:22:09 - INFO - __main__ - Step 661: {'lr': 0.000165, 'samples': 126912, 'steps': 660, 'loss/train': 4.710036277770996}7468109130859} +11/06/2021 21:22:09 - INFO - __main__ - Step 661: {'lr': 0.000165, 'samples': 126912, 'steps': 660, 'loss/train': 4.710036277770996}7468109130859} +11/06/2021 21:22:12 - INFO - __main__ - Step 668: {'lr': 0.00016675000000000001, 'samples': 128256, 'steps': 667, 'loss/train': 4.959212303161621} +11/06/2021 21:22:15 - INFO - __main__ - Step 672: {'lr': 0.00016775, 'samples': 129024, 'steps': 671, 'loss/train': 4.435437202453613}12303161621} +11/06/2021 21:22:17 - INFO - __main__ - Step 677: {'lr': 0.00016900000000000002, 'samples': 129984, 'steps': 676, 'loss/train': 4.679195880889893} +11/06/2021 21:22:19 - INFO - __main__ - Step 681: {'lr': 0.00017, 'samples': 130752, 'steps': 680, 'loss/train': 4.423855781555176}79195880889893} +11/06/2021 21:22:21 - INFO - __main__ - Step 685: {'lr': 0.000171, 'samples': 131520, 'steps': 684, 'loss/train': 4.730793476104736}9195880889893} +11/06/2021 21:22:21 - INFO - __main__ - Step 685: {'lr': 0.000171, 'samples': 131520, 'steps': 684, 'loss/train': 4.730793476104736}9195880889893} +11/06/2021 21:22:25 - INFO - __main__ - Step 692: {'lr': 0.00017275, 'samples': 132864, 'steps': 691, 'loss/train': 4.4996209144592285}5880889893} +11/06/2021 21:22:25 - INFO - __main__ - Step 692: {'lr': 0.00017275, 'samples': 132864, 'steps': 691, 'loss/train': 4.4996209144592285}5880889893} +11/06/2021 21:22:25 - INFO - __main__ - Step 692: {'lr': 0.00017275, 'samples': 132864, 'steps': 691, 'loss/train': 4.4996209144592285}5880889893} +11/06/2021 21:22:31 - INFO - __main__ - Step 703: {'lr': 0.00017549999999999998, 'samples': 134976, 'steps': 702, 'loss/train': 4.290457248687744} +11/06/2021 21:22:33 - INFO - __main__ - Step 709: {'lr': 0.000177, 'samples': 136128, 'steps': 708, 'loss/train': 4.986819267272949}0457248687744} +11/06/2021 21:22:33 - INFO - __main__ - Step 709: {'lr': 0.000177, 'samples': 136128, 'steps': 708, 'loss/train': 4.986819267272949}0457248687744} +11/06/2021 21:22:37 - INFO - __main__ - Step 716: {'lr': 0.00017875, 'samples': 137472, 'steps': 715, 'loss/train': 4.557127475738525}57248687744} +11/06/2021 21:22:39 - INFO - __main__ - Step 720: {'lr': 0.00017975, 'samples': 138240, 'steps': 719, 'loss/train': 4.539857864379883}57248687744} +11/06/2021 21:22:39 - INFO - __main__ - Step 720: {'lr': 0.00017975, 'samples': 138240, 'steps': 719, 'loss/train': 4.539857864379883}57248687744} +11/06/2021 21:22:43 - INFO - __main__ - Step 728: {'lr': 0.00018175, 'samples': 139776, 'steps': 727, 'loss/train': 4.543506145477295}57248687744} +11/06/2021 21:22:45 - INFO - __main__ - Step 732: {'lr': 0.00018275, 'samples': 140544, 'steps': 731, 'loss/train': 4.329798221588135}57248687744} +11/06/2021 21:22:47 - INFO - __main__ - Step 736: {'lr': 0.00018375, 'samples': 141312, 'steps': 735, 'loss/train': 5.126845359802246}57248687744} +11/06/2021 21:22:49 - INFO - __main__ - Step 741: {'lr': 0.000185, 'samples': 142272, 'steps': 740, 'loss/train': 4.524784564971924}6}57248687744} +11/06/2021 21:22:51 - INFO - __main__ - Step 745: {'lr': 0.000186, 'samples': 143040, 'steps': 744, 'loss/train': 4.4243059158325195}}57248687744} +11/06/2021 21:22:51 - INFO - __main__ - Step 745: {'lr': 0.000186, 'samples': 143040, 'steps': 744, 'loss/train': 4.4243059158325195}}57248687744} +11/06/2021 21:22:55 - INFO - __main__ - Step 752: {'lr': 0.00018775, 'samples': 144384, 'steps': 751, 'loss/train': 4.103482723236084}57248687744} +11/06/2021 21:22:57 - INFO - __main__ - Step 757: {'lr': 0.000189, 'samples': 145344, 'steps': 756, 'loss/train': 4.462242126464844}4}57248687744} +11/06/2021 21:22:57 - INFO - __main__ - Step 757: {'lr': 0.000189, 'samples': 145344, 'steps': 756, 'loss/train': 4.462242126464844}4}57248687744} +11/06/2021 21:23:02 - INFO - __main__ - Step 765: {'lr': 0.000191, 'samples': 146880, 'steps': 764, 'loss/train': 4.935421466827393}4}57248687744} +11/06/2021 21:23:04 - INFO - __main__ - Step 769: {'lr': 0.000192, 'samples': 147648, 'steps': 768, 'loss/train': 5.1701979637146}3}4}57248687744} +11/06/2021 21:23:05 - INFO - __main__ - Step 773: {'lr': 0.000193, 'samples': 148416, 'steps': 772, 'loss/train': 4.7581634521484375}}57248687744} +11/06/2021 21:23:07 - INFO - __main__ - Step 777: {'lr': 0.000194, 'samples': 149184, 'steps': 776, 'loss/train': 4.947287559509277}}}57248687744} +11/06/2021 21:23:10 - INFO - __main__ - Step 782: {'lr': 0.00019525, 'samples': 150144, 'steps': 781, 'loss/train': 4.558263301849365}57248687744} +11/06/2021 21:23:12 - INFO - __main__ - Step 786: {'lr': 0.00019625, 'samples': 150912, 'steps': 785, 'loss/train': 4.140824317932129}57248687744} +11/06/2021 21:23:12 - INFO - __main__ - Step 786: {'lr': 0.00019625, 'samples': 150912, 'steps': 785, 'loss/train': 4.140824317932129}57248687744} +11/06/2021 21:23:15 - INFO - __main__ - Step 793: {'lr': 0.00019800000000000002, 'samples': 152256, 'steps': 792, 'loss/train': 4.764225482940674} +11/06/2021 21:23:17 - INFO - __main__ - Step 797: {'lr': 0.000199, 'samples': 153024, 'steps': 796, 'loss/train': 4.558513641357422}4225482940674} +11/06/2021 21:23:17 - INFO - __main__ - Step 797: {'lr': 0.000199, 'samples': 153024, 'steps': 796, 'loss/train': 4.558513641357422}4225482940674} +11/06/2021 21:23:21 - INFO - __main__ - Step 804: {'lr': 0.00020075000000000003, 'samples': 154368, 'steps': 803, 'loss/train': 2.2776834964752197} +11/06/2021 21:23:21 - INFO - __main__ - Step 804: {'lr': 0.00020075000000000003, 'samples': 154368, 'steps': 803, 'loss/train': 2.2776834964752197} +11/06/2021 21:23:26 - INFO - __main__ - Step 812: {'lr': 0.00020275000000000002, 'samples': 155904, 'steps': 811, 'loss/train': 4.3080902099609375} +11/06/2021 21:23:27 - INFO - __main__ - Step 816: {'lr': 0.00020375, 'samples': 156672, 'steps': 815, 'loss/train': 4.675464153289795}902099609375} +11/06/2021 21:23:29 - INFO - __main__ - Step 820: {'lr': 0.00020475, 'samples': 157440, 'steps': 819, 'loss/train': 5.175144672393799}902099609375} +11/06/2021 21:23:32 - INFO - __main__ - Step 825: {'lr': 0.000206, 'samples': 158400, 'steps': 824, 'loss/train': 4.396790981292725}9}902099609375} +11/06/2021 21:23:34 - INFO - __main__ - Step 829: {'lr': 0.000207, 'samples': 159168, 'steps': 828, 'loss/train': 4.163397312164307}9}902099609375} +11/06/2021 21:23:36 - INFO - __main__ - Step 833: {'lr': 0.000208, 'samples': 159936, 'steps': 832, 'loss/train': 4.7883687019348145}}902099609375} +11/06/2021 21:23:37 - INFO - __main__ - Step 837: {'lr': 0.00020899999999999998, 'samples': 160704, 'steps': 836, 'loss/train': 4.873067378997803}} +11/06/2021 21:23:40 - INFO - __main__ - Step 841: {'lr': 0.00021, 'samples': 161472, 'steps': 840, 'loss/train': 6.019371509552002}73067378997803}} +11/06/2021 21:23:40 - INFO - __main__ - Step 841: {'lr': 0.00021, 'samples': 161472, 'steps': 840, 'loss/train': 6.019371509552002}73067378997803}} +11/06/2021 21:23:43 - INFO - __main__ - Step 848: {'lr': 0.00021175, 'samples': 162816, 'steps': 847, 'loss/train': 4.035452842712402}67378997803}} +11/06/2021 21:23:45 - INFO - __main__ - Step 852: {'lr': 0.00021275, 'samples': 163584, 'steps': 851, 'loss/train': 4.537678241729736}67378997803}} +11/06/2021 21:23:45 - INFO - __main__ - Step 852: {'lr': 0.00021275, 'samples': 163584, 'steps': 851, 'loss/train': 4.537678241729736}67378997803}} +11/06/2021 21:23:45 - INFO - __main__ - Step 852: {'lr': 0.00021275, 'samples': 163584, 'steps': 851, 'loss/train': 4.537678241729736}67378997803}} +11/06/2021 21:23:51 - INFO - __main__ - Step 863: {'lr': 0.0002155, 'samples': 165696, 'steps': 862, 'loss/train': 4.436905384063721}}67378997803}} +11/06/2021 21:23:53 - INFO - __main__ - Step 867: {'lr': 0.0002165, 'samples': 166464, 'steps': 866, 'loss/train': 4.653875827789307}}67378997803}} +11/06/2021 21:23:55 - INFO - __main__ - Step 872: {'lr': 0.00021775, 'samples': 167424, 'steps': 871, 'loss/train': 1.9217588901519775}7378997803}} +11/06/2021 21:23:58 - INFO - __main__ - Step 877: {'lr': 0.000219, 'samples': 168384, 'steps': 876, 'loss/train': 4.769442558288574}75}7378997803}} +11/06/2021 21:23:58 - INFO - __main__ - Step 877: {'lr': 0.000219, 'samples': 168384, 'steps': 876, 'loss/train': 4.769442558288574}75}7378997803}} +11/06/2021 21:24:02 - INFO - __main__ - Step 884: {'lr': 0.00022075, 'samples': 169728, 'steps': 883, 'loss/train': 4.347689151763916}}7378997803}} +11/06/2021 21:24:03 - INFO - __main__ - Step 888: {'lr': 0.00022175, 'samples': 170496, 'steps': 887, 'loss/train': 4.312256813049316}}7378997803}} +11/06/2021 21:24:05 - INFO - __main__ - Step 892: {'lr': 0.00022275000000000002, 'samples': 171264, 'steps': 891, 'loss/train': 4.234619617462158}} +11/06/2021 21:24:07 - INFO - __main__ - Step 897: {'lr': 0.000224, 'samples': 172224, 'steps': 896, 'loss/train': 3.291337251663208}4619617462158}} +11/06/2021 21:24:10 - INFO - __main__ - Step 903: {'lr': 0.0002255, 'samples': 173376, 'steps': 902, 'loss/train': 4.559982776641846}619617462158}} +11/06/2021 21:24:10 - INFO - __main__ - Step 903: {'lr': 0.0002255, 'samples': 173376, 'steps': 902, 'loss/train': 4.559982776641846}619617462158}} +11/06/2021 21:24:10 - INFO - __main__ - Step 903: {'lr': 0.0002255, 'samples': 173376, 'steps': 902, 'loss/train': 4.559982776641846}619617462158}} +11/06/2021 21:24:15 - INFO - __main__ - Step 913: {'lr': 0.000228, 'samples': 175296, 'steps': 912, 'loss/train': 4.5875163078308105}619617462158}} +11/06/2021 21:24:15 - INFO - __main__ - Step 913: {'lr': 0.000228, 'samples': 175296, 'steps': 912, 'loss/train': 4.5875163078308105}619617462158}} +11/06/2021 21:24:19 - INFO - __main__ - Step 921: {'lr': 0.00023, 'samples': 176832, 'steps': 920, 'loss/train': 4.508198261260986}5}619617462158}} +11/06/2021 21:24:21 - INFO - __main__ - Step 925: {'lr': 0.000231, 'samples': 177600, 'steps': 924, 'loss/train': 5.673306941986084}}619617462158}} +11/06/2021 21:24:23 - INFO - __main__ - Step 929: {'lr': 0.00023200000000000003, 'samples': 178368, 'steps': 928, 'loss/train': 3.650172233581543}} +11/06/2021 21:24:25 - INFO - __main__ - Step 934: {'lr': 0.00023325, 'samples': 179328, 'steps': 933, 'loss/train': 3.821877956390381}72233581543}} +11/06/2021 21:24:25 - INFO - __main__ - Step 934: {'lr': 0.00023325, 'samples': 179328, 'steps': 933, 'loss/train': 3.821877956390381}72233581543}} +11/06/2021 21:24:30 - INFO - __main__ - Step 942: {'lr': 0.00023525, 'samples': 180864, 'steps': 941, 'loss/train': 4.118391036987305}72233581543}} +11/06/2021 21:24:32 - INFO - __main__ - Step 946: {'lr': 0.00023625, 'samples': 181632, 'steps': 945, 'loss/train': 4.698647975921631}72233581543}} +11/06/2021 21:24:33 - INFO - __main__ - Step 950: {'lr': 0.00023725, 'samples': 182400, 'steps': 949, 'loss/train': 4.038322448730469}72233581543}} +11/06/2021 21:24:35 - INFO - __main__ - Step 954: {'lr': 0.00023825, 'samples': 183168, 'steps': 953, 'loss/train': 4.3065505027771}9}72233581543}} +11/06/2021 21:24:38 - INFO - __main__ - Step 959: {'lr': 0.0002395, 'samples': 184128, 'steps': 958, 'loss/train': 4.376034259796143}}72233581543}} +11/06/2021 21:24:38 - INFO - __main__ - Step 959: {'lr': 0.0002395, 'samples': 184128, 'steps': 958, 'loss/train': 4.376034259796143}}72233581543}} +11/06/2021 21:24:41 - INFO - __main__ - Step 966: {'lr': 0.00024125, 'samples': 185472, 'steps': 965, 'loss/train': 4.45121431350708}}72233581543}} +11/06/2021 21:24:43 - INFO - __main__ - Step 970: {'lr': 0.00024225, 'samples': 186240, 'steps': 969, 'loss/train': 4.633758544921875}72233581543}} +11/06/2021 21:24:46 - INFO - __main__ - Step 975: {'lr': 0.0002435, 'samples': 187200, 'steps': 974, 'loss/train': 4.149434566497803}}72233581543}} +11/06/2021 21:24:48 - INFO - __main__ - Step 979: {'lr': 0.0002445, 'samples': 187968, 'steps': 978, 'loss/train': 4.069120407104492}}72233581543}} +11/06/2021 21:24:50 - INFO - __main__ - Step 983: {'lr': 0.0002455, 'samples': 188736, 'steps': 982, 'loss/train': 4.437088966369629}}72233581543}} +11/06/2021 21:24:51 - INFO - __main__ - Step 987: {'lr': 0.00024650000000000003, 'samples': 189504, 'steps': 986, 'loss/train': 3.8113763332366943} +11/06/2021 21:24:53 - INFO - __main__ - Step 991: {'lr': 0.0002475, 'samples': 190272, 'steps': 990, 'loss/train': 4.3600897789001465}763332366943} +11/06/2021 21:24:56 - INFO - __main__ - Step 996: {'lr': 0.00024875, 'samples': 191232, 'steps': 995, 'loss/train': 4.652307510375977}763332366943} +11/06/2021 21:24:58 - INFO - __main__ - Step 1000: {'lr': 0.00024975, 'samples': 192000, 'steps': 999, 'loss/train': 4.688298225402832}63332366943} +11/06/2021 21:24:58 - INFO - __main__ - Step 1000: {'lr': 0.00024975, 'samples': 192000, 'steps': 999, 'loss/train': 4.688298225402832}63332366943} +11/06/2021 21:25:01 - INFO - __main__ - Step 1007: {'lr': 0.0002515, 'samples': 193344, 'steps': 1006, 'loss/train': 2.1154818534851074}3332366943} +11/06/2021 21:25:04 - INFO - __main__ - Step 1012: {'lr': 0.00025275, 'samples': 194304, 'steps': 1011, 'loss/train': 3.661561965942383}3332366943} +11/06/2021 21:25:06 - INFO - __main__ - Step 1017: {'lr': 0.000254, 'samples': 195264, 'steps': 1016, 'loss/train': 6.699620723724365}3}3332366943} +11/06/2021 21:25:08 - INFO - __main__ - Step 1021: {'lr': 0.000255, 'samples': 196032, 'steps': 1020, 'loss/train': 3.97232723236084}}3}3332366943} +11/06/2021 21:25:10 - INFO - __main__ - Step 1025: {'lr': 0.000256, 'samples': 196800, 'steps': 1024, 'loss/train': 4.093658924102783}3}3332366943} +11/06/2021 21:25:11 - INFO - __main__ - Step 1029: {'lr': 0.000257, 'samples': 197568, 'steps': 1028, 'loss/train': 3.6540799140930176}}3332366943} +11/06/2021 21:25:14 - INFO - __main__ - Step 1033: {'lr': 0.00025800000000000004, 'samples': 198336, 'steps': 1032, 'loss/train': 1.9851371049880981} +11/06/2021 21:25:16 - INFO - __main__ - Step 1038: {'lr': 0.00025925, 'samples': 199296, 'steps': 1037, 'loss/train': 5.716175556182861}371049880981} +11/06/2021 21:25:18 - INFO - __main__ - Step 1042: {'lr': 0.00026025, 'samples': 200064, 'steps': 1041, 'loss/train': 4.489924430847168}371049880981} +11/06/2021 21:25:18 - INFO - __main__ - Step 1042: {'lr': 0.00026025, 'samples': 200064, 'steps': 1041, 'loss/train': 4.489924430847168}371049880981} +11/06/2021 21:25:21 - INFO - __main__ - Step 1049: {'lr': 0.000262, 'samples': 201408, 'steps': 1048, 'loss/train': 3.938405990600586}8}371049880981} +11/06/2021 21:25:23 - INFO - __main__ - Step 1053: {'lr': 0.000263, 'samples': 202176, 'steps': 1052, 'loss/train': 4.3338303565979}6}8}371049880981} +11/06/2021 21:25:26 - INFO - __main__ - Step 1058: {'lr': 0.00026425, 'samples': 203136, 'steps': 1057, 'loss/train': 4.140725135803223}371049880981} +11/06/2021 21:25:26 - INFO - __main__ - Step 1058: {'lr': 0.00026425, 'samples': 203136, 'steps': 1057, 'loss/train': 4.140725135803223}371049880981} +11/06/2021 21:25:30 - INFO - __main__ - Step 1066: {'lr': 0.00026625, 'samples': 204672, 'steps': 1065, 'loss/train': 3.962754011154175}371049880981} +11/06/2021 21:25:31 - INFO - __main__ - Step 1070: {'lr': 0.00026725, 'samples': 205440, 'steps': 1069, 'loss/train': 2.362624168395996}371049880981} +11/06/2021 21:25:34 - INFO - __main__ - Step 1074: {'lr': 0.00026825, 'samples': 206208, 'steps': 1073, 'loss/train': 3.240086078643799}371049880981} +11/06/2021 21:25:36 - INFO - __main__ - Step 1079: {'lr': 0.00026950000000000005, 'samples': 207168, 'steps': 1078, 'loss/train': 4.370131015777588}} +11/06/2021 21:25:38 - INFO - __main__ - Step 1084: {'lr': 0.00027075, 'samples': 208128, 'steps': 1083, 'loss/train': 3.959185838699341}31015777588}} +11/06/2021 21:25:38 - INFO - __main__ - Step 1084: {'lr': 0.00027075, 'samples': 208128, 'steps': 1083, 'loss/train': 3.959185838699341}31015777588}} +11/06/2021 21:25:42 - INFO - __main__ - Step 1091: {'lr': 0.0002725, 'samples': 209472, 'steps': 1090, 'loss/train': 3.5656397342681885}31015777588}} +11/06/2021 21:25:44 - INFO - __main__ - Step 1095: {'lr': 0.00027350000000000003, 'samples': 210240, 'steps': 1094, 'loss/train': 4.242520332336426}} +11/06/2021 21:25:46 - INFO - __main__ - Step 1099: {'lr': 0.0002745, 'samples': 211008, 'steps': 1098, 'loss/train': 4.089423179626465}520332336426}} +11/06/2021 21:25:48 - INFO - __main__ - Step 1103: {'lr': 0.00027550000000000003, 'samples': 211776, 'steps': 1102, 'loss/train': 6.588270664215088}} +11/06/2021 21:25:48 - INFO - __main__ - Step 1103: {'lr': 0.00027550000000000003, 'samples': 211776, 'steps': 1102, 'loss/train': 6.588270664215088}} +11/06/2021 21:25:52 - INFO - __main__ - Step 1110: {'lr': 0.00027725, 'samples': 213120, 'steps': 1109, 'loss/train': 4.272808074951172}70664215088}} +11/06/2021 21:25:52 - INFO - __main__ - Step 1110: {'lr': 0.00027725, 'samples': 213120, 'steps': 1109, 'loss/train': 4.272808074951172}70664215088}} +11/06/2021 21:25:56 - INFO - __main__ - Step 1118: {'lr': 0.00027925, 'samples': 214656, 'steps': 1117, 'loss/train': 4.0414958000183105}0664215088}} +11/06/2021 21:25:57 - INFO - __main__ - Step 1122: {'lr': 0.00028025, 'samples': 215424, 'steps': 1121, 'loss/train': 4.281680583953857}}0664215088}} +11/06/2021 21:26:00 - INFO - __main__ - Step 1126: {'lr': 0.00028125000000000003, 'samples': 216192, 'steps': 1125, 'loss/train': 4.240171432495117}} +11/06/2021 21:26:00 - INFO - __main__ - Step 1126: {'lr': 0.00028125000000000003, 'samples': 216192, 'steps': 1125, 'loss/train': 4.240171432495117}} +11/06/2021 21:26:04 - INFO - __main__ - Step 1134: {'lr': 0.00028325000000000003, 'samples': 217728, 'steps': 1133, 'loss/train': 4.218957424163818}} +11/06/2021 21:26:06 - INFO - __main__ - Step 1138: {'lr': 0.00028425, 'samples': 218496, 'steps': 1137, 'loss/train': 4.085984706878662}57424163818}} +11/06/2021 21:26:07 - INFO - __main__ - Step 1142: {'lr': 0.00028525, 'samples': 219264, 'steps': 1141, 'loss/train': 3.885024070739746}57424163818}} +11/06/2021 21:26:10 - INFO - __main__ - Step 1146: {'lr': 0.00028625, 'samples': 220032, 'steps': 1145, 'loss/train': 3.5987935066223145}7424163818}} +11/06/2021 21:26:12 - INFO - __main__ - Step 1151: {'lr': 0.0002875, 'samples': 220992, 'steps': 1150, 'loss/train': 3.9367594718933105}}7424163818}} +11/06/2021 21:26:14 - INFO - __main__ - Step 1155: {'lr': 0.00028849999999999997, 'samples': 221760, 'steps': 1154, 'loss/train': 4.096200942993164}} +11/06/2021 21:26:16 - INFO - __main__ - Step 1159: {'lr': 0.0002895, 'samples': 222528, 'steps': 1158, 'loss/train': 2.7520174980163574}00942993164}} +11/06/2021 21:26:18 - INFO - __main__ - Step 1163: {'lr': 0.00029049999999999996, 'samples': 223296, 'steps': 1162, 'loss/train': 4.1517109870910645} +11/06/2021 21:26:20 - INFO - __main__ - Step 1167: {'lr': 0.0002915, 'samples': 224064, 'steps': 1166, 'loss/train': 3.959521770477295}7109870910645} +11/06/2021 21:26:22 - INFO - __main__ - Step 1172: {'lr': 0.00029275000000000004, 'samples': 225024, 'steps': 1171, 'loss/train': 4.092573642730713}} +11/06/2021 21:26:24 - INFO - __main__ - Step 1176: {'lr': 0.00029375, 'samples': 225792, 'steps': 1175, 'loss/train': 3.6532394886016846}3642730713}} +11/06/2021 21:26:24 - INFO - __main__ - Step 1176: {'lr': 0.00029375, 'samples': 225792, 'steps': 1175, 'loss/train': 3.6532394886016846}3642730713}} +11/06/2021 21:26:27 - INFO - __main__ - Step 1183: {'lr': 0.00029549999999999997, 'samples': 227136, 'steps': 1182, 'loss/train': 4.172230243682861}} +11/06/2021 21:26:30 - INFO - __main__ - Step 1188: {'lr': 0.00029675000000000003, 'samples': 228096, 'steps': 1187, 'loss/train': 3.7164466381073}1}} +11/06/2021 21:26:32 - INFO - __main__ - Step 1193: {'lr': 0.000298, 'samples': 229056, 'steps': 1192, 'loss/train': 5.458200454711914}64466381073}1}} +11/06/2021 21:26:32 - INFO - __main__ - Step 1193: {'lr': 0.000298, 'samples': 229056, 'steps': 1192, 'loss/train': 5.458200454711914}64466381073}1}} +11/06/2021 21:26:36 - INFO - __main__ - Step 1200: {'lr': 0.00029975000000000005, 'samples': 230400, 'steps': 1199, 'loss/train': 4.041784286499023}} +11/06/2021 21:26:37 - INFO - __main__ - Step 1204: {'lr': 0.00030075, 'samples': 231168, 'steps': 1203, 'loss/train': 4.123647689819336}84286499023}} +11/06/2021 21:26:40 - INFO - __main__ - Step 1208: {'lr': 0.00030175000000000004, 'samples': 231936, 'steps': 1207, 'loss/train': 4.022327423095703}} +11/06/2021 21:26:42 - INFO - __main__ - Step 1213: {'lr': 0.000303, 'samples': 232896, 'steps': 1212, 'loss/train': 3.7347517013549805}327423095703}} +11/06/2021 21:26:44 - INFO - __main__ - Step 1218: {'lr': 0.00030425000000000005, 'samples': 233856, 'steps': 1217, 'loss/train': 3.7530202865600586} +11/06/2021 21:26:44 - INFO - __main__ - Step 1218: {'lr': 0.00030425000000000005, 'samples': 233856, 'steps': 1217, 'loss/train': 3.7530202865600586} +11/06/2021 21:26:44 - INFO - __main__ - Step 1218: {'lr': 0.00030425000000000005, 'samples': 233856, 'steps': 1217, 'loss/train': 3.7530202865600586} +11/06/2021 21:26:50 - INFO - __main__ - Step 1229: {'lr': 0.000307, 'samples': 235968, 'steps': 1228, 'loss/train': 4.392697811126709}30202865600586} +11/06/2021 21:26:52 - INFO - __main__ - Step 1234: {'lr': 0.00030825000000000004, 'samples': 236928, 'steps': 1233, 'loss/train': 3.6062018871307373} +11/06/2021 21:26:54 - INFO - __main__ - Step 1238: {'lr': 0.00030925, 'samples': 237696, 'steps': 1237, 'loss/train': 5.033356666564941}018871307373} +11/06/2021 21:26:56 - INFO - __main__ - Step 1242: {'lr': 0.00031025000000000003, 'samples': 238464, 'steps': 1241, 'loss/train': 3.553842067718506}} +11/06/2021 21:26:58 - INFO - __main__ - Step 1246: {'lr': 0.00031125000000000006, 'samples': 239232, 'steps': 1245, 'loss/train': 3.7371480464935303} +11/06/2021 21:27:00 - INFO - __main__ - Step 1250: {'lr': 0.00031225000000000003, 'samples': 240000, 'steps': 1249, 'loss/train': 3.6074068546295166} +11/06/2021 21:27:02 - INFO - __main__ - Step 1255: {'lr': 0.00031350000000000003, 'samples': 240960, 'steps': 1254, 'loss/train': 3.425907850265503}} +11/06/2021 21:27:04 - INFO - __main__ - Step 1259: {'lr': 0.0003145, 'samples': 241728, 'steps': 1258, 'loss/train': 4.367678642272949}907850265503}} +11/06/2021 21:27:04 - INFO - __main__ - Step 1259: {'lr': 0.0003145, 'samples': 241728, 'steps': 1258, 'loss/train': 4.367678642272949}907850265503}} +11/06/2021 21:27:07 - INFO - __main__ - Step 1266: {'lr': 0.00031624999999999996, 'samples': 243072, 'steps': 1265, 'loss/train': 3.6147239208221436} +11/06/2021 21:27:10 - INFO - __main__ - Step 1271: {'lr': 0.0003175, 'samples': 244032, 'steps': 1270, 'loss/train': 3.718264102935791}7239208221436} +11/06/2021 21:27:10 - INFO - __main__ - Step 1271: {'lr': 0.0003175, 'samples': 244032, 'steps': 1270, 'loss/train': 3.718264102935791}7239208221436} +11/06/2021 21:27:14 - INFO - __main__ - Step 1278: {'lr': 0.00031925, 'samples': 245376, 'steps': 1277, 'loss/train': 2.880706548690796}239208221436} +11/06/2021 21:27:16 - INFO - __main__ - Step 1282: {'lr': 0.00032025, 'samples': 246144, 'steps': 1281, 'loss/train': 2.492274761199951}239208221436} +11/06/2021 21:27:18 - INFO - __main__ - Step 1286: {'lr': 0.00032125, 'samples': 246912, 'steps': 1285, 'loss/train': 4.252817153930664}239208221436} +11/06/2021 21:27:20 - INFO - __main__ - Step 1291: {'lr': 0.00032250000000000003, 'samples': 247872, 'steps': 1290, 'loss/train': 3.7204911708831787} +11/06/2021 21:27:23 - INFO - __main__ - Step 1296: {'lr': 0.00032375, 'samples': 248832, 'steps': 1295, 'loss/train': 3.61068058013916}4911708831787} +11/06/2021 21:27:25 - INFO - __main__ - Step 1300: {'lr': 0.00032475, 'samples': 249600, 'steps': 1299, 'loss/train': 3.8040266036987305}11708831787} +11/06/2021 21:27:27 - INFO - __main__ - Step 1304: {'lr': 0.00032575, 'samples': 250368, 'steps': 1303, 'loss/train': 3.846041440963745}}11708831787} +11/06/2021 21:27:27 - INFO - __main__ - Step 1304: {'lr': 0.00032575, 'samples': 250368, 'steps': 1303, 'loss/train': 3.846041440963745}}11708831787} +11/06/2021 21:27:30 - INFO - __main__ - Step 1311: {'lr': 0.00032750000000000005, 'samples': 251712, 'steps': 1310, 'loss/train': 3.8077216148376465} +11/06/2021 21:27:33 - INFO - __main__ - Step 1317: {'lr': 0.00032900000000000003, 'samples': 252864, 'steps': 1316, 'loss/train': 3.848276138305664}} +11/06/2021 21:27:35 - INFO - __main__ - Step 1321: {'lr': 0.00033, 'samples': 253632, 'steps': 1320, 'loss/train': 3.623622179031372}48276138305664}} +11/06/2021 21:27:35 - INFO - __main__ - Step 1321: {'lr': 0.00033, 'samples': 253632, 'steps': 1320, 'loss/train': 3.623622179031372}48276138305664}} +11/06/2021 21:27:38 - INFO - __main__ - Step 1328: {'lr': 0.00033175, 'samples': 254976, 'steps': 1327, 'loss/train': 3.815504550933838}76138305664}} +11/06/2021 21:27:40 - INFO - __main__ - Step 1332: {'lr': 0.00033275, 'samples': 255744, 'steps': 1331, 'loss/train': 3.404329299926758}76138305664}} +11/06/2021 21:27:40 - INFO - __main__ - Step 1332: {'lr': 0.00033275, 'samples': 255744, 'steps': 1331, 'loss/train': 3.404329299926758}76138305664}} +11/06/2021 21:27:40 - INFO - __main__ - Step 1332: {'lr': 0.00033275, 'samples': 255744, 'steps': 1331, 'loss/train': 3.404329299926758}76138305664}} +11/06/2021 21:27:46 - INFO - __main__ - Step 1343: {'lr': 0.0003355, 'samples': 257856, 'steps': 1342, 'loss/train': 3.234477996826172}}76138305664}} +11/06/2021 21:27:48 - INFO - __main__ - Step 1347: {'lr': 0.00033650000000000005, 'samples': 258624, 'steps': 1346, 'loss/train': 3.310671329498291}} +11/06/2021 21:27:50 - INFO - __main__ - Step 1352: {'lr': 0.00033775, 'samples': 259584, 'steps': 1351, 'loss/train': 3.3598763942718506}1329498291}} +11/06/2021 21:27:53 - INFO - __main__ - Step 1356: {'lr': 0.00033875, 'samples': 260352, 'steps': 1355, 'loss/train': 3.3796229362487793}1329498291}} +11/06/2021 21:27:55 - INFO - __main__ - Step 1360: {'lr': 0.00033975, 'samples': 261120, 'steps': 1359, 'loss/train': 3.659208059310913}}1329498291}} +11/06/2021 21:27:56 - INFO - __main__ - Step 1364: {'lr': 0.00034075, 'samples': 261888, 'steps': 1363, 'loss/train': 4.257739543914795}}1329498291}} +11/06/2021 21:27:58 - INFO - __main__ - Step 1368: {'lr': 0.00034175, 'samples': 262656, 'steps': 1367, 'loss/train': 2.7847213745117188}1329498291}} +11/06/2021 21:27:58 - INFO - __main__ - Step 1368: {'lr': 0.00034175, 'samples': 262656, 'steps': 1367, 'loss/train': 2.7847213745117188}1329498291}} +11/06/2021 21:28:03 - INFO - __main__ - Step 1376: {'lr': 0.00034375, 'samples': 264192, 'steps': 1375, 'loss/train': 3.6449296474456787}1329498291}} +11/06/2021 21:28:05 - INFO - __main__ - Step 1380: {'lr': 0.00034475, 'samples': 264960, 'steps': 1379, 'loss/train': 3.7418301105499268}1329498291}} +11/06/2021 21:28:06 - INFO - __main__ - Step 1384: {'lr': 0.00034575000000000003, 'samples': 265728, 'steps': 1383, 'loss/train': 3.5448079109191895} +11/06/2021 21:28:08 - INFO - __main__ - Step 1388: {'lr': 0.00034675, 'samples': 266496, 'steps': 1387, 'loss/train': 5.252135276794434}079109191895} +11/06/2021 21:28:11 - INFO - __main__ - Step 1393: {'lr': 0.000348, 'samples': 267456, 'steps': 1392, 'loss/train': 3.698169231414795}4}079109191895} +11/06/2021 21:28:11 - INFO - __main__ - Step 1393: {'lr': 0.000348, 'samples': 267456, 'steps': 1392, 'loss/train': 3.698169231414795}4}079109191895} +11/06/2021 21:28:15 - INFO - __main__ - Step 1401: {'lr': 0.00035, 'samples': 268992, 'steps': 1400, 'loss/train': 3.4211158752441406}4}079109191895} +11/06/2021 21:28:16 - INFO - __main__ - Step 1405: {'lr': 0.00035099999999999997, 'samples': 269760, 'steps': 1404, 'loss/train': 3.948554277420044}} +11/06/2021 21:28:18 - INFO - __main__ - Step 1409: {'lr': 0.000352, 'samples': 270528, 'steps': 1408, 'loss/train': 3.544276237487793}8554277420044}} +11/06/2021 21:28:18 - INFO - __main__ - Step 1409: {'lr': 0.000352, 'samples': 270528, 'steps': 1408, 'loss/train': 3.544276237487793}8554277420044}} +11/06/2021 21:28:23 - INFO - __main__ - Step 1417: {'lr': 0.000354, 'samples': 272064, 'steps': 1416, 'loss/train': 3.9992828369140625}554277420044}} +11/06/2021 21:28:23 - INFO - __main__ - Step 1417: {'lr': 0.000354, 'samples': 272064, 'steps': 1416, 'loss/train': 3.9992828369140625}554277420044}} +11/06/2021 21:28:26 - INFO - __main__ - Step 1424: {'lr': 0.00035575, 'samples': 273408, 'steps': 1423, 'loss/train': 4.185265064239502}54277420044}} +11/06/2021 21:28:29 - INFO - __main__ - Step 1430: {'lr': 0.00035725000000000004, 'samples': 274560, 'steps': 1429, 'loss/train': 3.588322162628174}} +11/06/2021 21:28:31 - INFO - __main__ - Step 1434: {'lr': 0.00035825, 'samples': 275328, 'steps': 1433, 'loss/train': 3.3060061931610107}2162628174}} +11/06/2021 21:28:33 - INFO - __main__ - Step 1438: {'lr': 0.00035925000000000003, 'samples': 276096, 'steps': 1437, 'loss/train': 3.045379877090454}} +11/06/2021 21:28:33 - INFO - __main__ - Step 1438: {'lr': 0.00035925000000000003, 'samples': 276096, 'steps': 1437, 'loss/train': 3.045379877090454}} +11/06/2021 21:28:36 - INFO - __main__ - Step 1445: {'lr': 0.000361, 'samples': 277440, 'steps': 1444, 'loss/train': 3.245635747909546}5379877090454}} +11/06/2021 21:28:39 - INFO - __main__ - Step 1450: {'lr': 0.00036225000000000005, 'samples': 278400, 'steps': 1449, 'loss/train': 3.1428816318511963} +11/06/2021 21:28:41 - INFO - __main__ - Step 1455: {'lr': 0.0003635, 'samples': 279360, 'steps': 1454, 'loss/train': 3.257840871810913}8816318511963} +11/06/2021 21:28:41 - INFO - __main__ - Step 1455: {'lr': 0.0003635, 'samples': 279360, 'steps': 1454, 'loss/train': 3.257840871810913}8816318511963} +11/06/2021 21:28:44 - INFO - __main__ - Step 1462: {'lr': 0.00036525, 'samples': 280704, 'steps': 1461, 'loss/train': 3.5692012310028076}16318511963} +11/06/2021 21:28:46 - INFO - __main__ - Step 1466: {'lr': 0.00036625000000000004, 'samples': 281472, 'steps': 1465, 'loss/train': 3.158153772354126}} +11/06/2021 21:28:49 - INFO - __main__ - Step 1471: {'lr': 0.0003675, 'samples': 282432, 'steps': 1470, 'loss/train': 3.3369407653808594}53772354126}} +11/06/2021 21:28:51 - INFO - __main__ - Step 1475: {'lr': 0.0003685, 'samples': 283200, 'steps': 1474, 'loss/train': 2.7034976482391357}53772354126}} +11/06/2021 21:28:51 - INFO - __main__ - Step 1475: {'lr': 0.0003685, 'samples': 283200, 'steps': 1474, 'loss/train': 2.7034976482391357}53772354126}} +11/06/2021 21:28:54 - INFO - __main__ - Step 1481: {'lr': 0.00037, 'samples': 284352, 'steps': 1480, 'loss/train': 3.1665492057800293}7}53772354126}} +11/06/2021 21:28:54 - INFO - __main__ - Step 1481: {'lr': 0.00037, 'samples': 284352, 'steps': 1480, 'loss/train': 3.1665492057800293}7}53772354126}} +11/06/2021 21:28:58 - INFO - __main__ - Step 1489: {'lr': 0.000372, 'samples': 285888, 'steps': 1488, 'loss/train': 3.5077946186065674}}53772354126}} +11/06/2021 21:29:00 - INFO - __main__ - Step 1493: {'lr': 0.000373, 'samples': 286656, 'steps': 1492, 'loss/train': 3.127577066421509}}}53772354126}} +11/06/2021 21:29:00 - INFO - __main__ - Step 1493: {'lr': 0.000373, 'samples': 286656, 'steps': 1492, 'loss/train': 3.127577066421509}}}53772354126}} +11/06/2021 21:29:04 - INFO - __main__ - Step 1500: {'lr': 0.00037475000000000003, 'samples': 288000, 'steps': 1499, 'loss/train': 3.4952762126922607} +11/06/2021 21:29:07 - INFO - __main__ - Step 1504: {'lr': 0.00037575, 'samples': 288768, 'steps': 1503, 'loss/train': 4.3909077644348145}62126922607} +11/06/2021 21:29:09 - INFO - __main__ - Step 1509: {'lr': 0.000377, 'samples': 289728, 'steps': 1508, 'loss/train': 3.3940863609313965}5}62126922607} +11/06/2021 21:29:11 - INFO - __main__ - Step 1513: {'lr': 0.000378, 'samples': 290496, 'steps': 1512, 'loss/train': 3.0633351802825928}5}62126922607} +11/06/2021 21:29:11 - INFO - __main__ - Step 1513: {'lr': 0.000378, 'samples': 290496, 'steps': 1512, 'loss/train': 3.0633351802825928}5}62126922607} +11/06/2021 21:29:11 - INFO - __main__ - Step 1513: {'lr': 0.000378, 'samples': 290496, 'steps': 1512, 'loss/train': 3.0633351802825928}5}62126922607} +11/06/2021 21:29:17 - INFO - __main__ - Step 1523: {'lr': 0.00038050000000000003, 'samples': 292416, 'steps': 1522, 'loss/train': 1.1130292415618896} +11/06/2021 21:29:19 - INFO - __main__ - Step 1527: {'lr': 0.0003815, 'samples': 293184, 'steps': 1526, 'loss/train': 2.968132972717285}0292415618896} +11/06/2021 21:29:19 - INFO - __main__ - Step 1527: {'lr': 0.0003815, 'samples': 293184, 'steps': 1526, 'loss/train': 2.968132972717285}0292415618896} +11/06/2021 21:29:23 - INFO - __main__ - Step 1535: {'lr': 0.0003835, 'samples': 294720, 'steps': 1534, 'loss/train': 3.5091545581817627}292415618896} +11/06/2021 21:29:25 - INFO - __main__ - Step 1539: {'lr': 0.0003845, 'samples': 295488, 'steps': 1538, 'loss/train': 3.5664308071136475}292415618896} +11/06/2021 21:29:27 - INFO - __main__ - Step 1543: {'lr': 0.0003855, 'samples': 296256, 'steps': 1542, 'loss/train': 3.427462100982666}}292415618896} +11/06/2021 21:29:29 - INFO - __main__ - Step 1548: {'lr': 0.00038675, 'samples': 297216, 'steps': 1547, 'loss/train': 3.2712979316711426}92415618896} +11/06/2021 21:29:29 - INFO - __main__ - Step 1548: {'lr': 0.00038675, 'samples': 297216, 'steps': 1547, 'loss/train': 3.2712979316711426}92415618896} +11/06/2021 21:29:29 - INFO - __main__ - Step 1548: {'lr': 0.00038675, 'samples': 297216, 'steps': 1547, 'loss/train': 3.2712979316711426}92415618896} +11/06/2021 21:29:35 - INFO - __main__ - Step 1558: {'lr': 0.00038925, 'samples': 299136, 'steps': 1557, 'loss/train': 3.1180825233459473}92415618896} +11/06/2021 21:29:37 - INFO - __main__ - Step 1564: {'lr': 0.00039075, 'samples': 300288, 'steps': 1563, 'loss/train': 3.6809487342834473}92415618896} +11/06/2021 21:29:37 - INFO - __main__ - Step 1564: {'lr': 0.00039075, 'samples': 300288, 'steps': 1563, 'loss/train': 3.6809487342834473}92415618896} +11/06/2021 21:29:41 - INFO - __main__ - Step 1571: {'lr': 0.0003925, 'samples': 301632, 'steps': 1570, 'loss/train': 2.498239040374756}3}92415618896} +11/06/2021 21:29:43 - INFO - __main__ - Step 1575: {'lr': 0.0003935, 'samples': 302400, 'steps': 1574, 'loss/train': 2.607938289642334}3}92415618896} +11/06/2021 21:29:45 - INFO - __main__ - Step 1580: {'lr': 0.00039474999999999997, 'samples': 303360, 'steps': 1579, 'loss/train': 3.356081008911133}} +11/06/2021 21:29:47 - INFO - __main__ - Step 1584: {'lr': 0.00039575, 'samples': 304128, 'steps': 1583, 'loss/train': 3.310321807861328}81008911133}} +11/06/2021 21:29:49 - INFO - __main__ - Step 1588: {'lr': 0.00039675, 'samples': 304896, 'steps': 1587, 'loss/train': 3.2099974155426025}1008911133}} +11/06/2021 21:29:51 - INFO - __main__ - Step 1592: {'lr': 0.00039775, 'samples': 305664, 'steps': 1591, 'loss/train': 2.313783884048462}}1008911133}} +11/06/2021 21:29:53 - INFO - __main__ - Step 1596: {'lr': 0.00039875, 'samples': 306432, 'steps': 1595, 'loss/train': 2.543515205383301}}1008911133}} +11/06/2021 21:29:55 - INFO - __main__ - Step 1600: {'lr': 0.00039975, 'samples': 307200, 'steps': 1599, 'loss/train': 3.1416678428649902}1008911133}} +11/06/2021 21:29:58 - INFO - __main__ - Step 1605: {'lr': 0.00040100000000000004, 'samples': 308160, 'steps': 1604, 'loss/train': 3.134627103805542}} +11/06/2021 21:29:58 - INFO - __main__ - Step 1605: {'lr': 0.00040100000000000004, 'samples': 308160, 'steps': 1604, 'loss/train': 3.134627103805542}} +11/06/2021 21:30:01 - INFO - __main__ - Step 1612: {'lr': 0.00040275, 'samples': 309504, 'steps': 1611, 'loss/train': 3.279484987258911}27103805542}} +11/06/2021 21:30:03 - INFO - __main__ - Step 1616: {'lr': 0.00040375000000000003, 'samples': 310272, 'steps': 1615, 'loss/train': 2.6593739986419678} +11/06/2021 21:30:05 - INFO - __main__ - Step 1621: {'lr': 0.00040500000000000003, 'samples': 311232, 'steps': 1620, 'loss/train': 3.027345657348633}} +11/06/2021 21:30:05 - INFO - __main__ - Step 1621: {'lr': 0.00040500000000000003, 'samples': 311232, 'steps': 1620, 'loss/train': 3.027345657348633}} +11/06/2021 21:30:09 - INFO - __main__ - Step 1629: {'lr': 0.00040699999999999997, 'samples': 312768, 'steps': 1628, 'loss/train': 3.6013989448547363} +11/06/2021 21:30:11 - INFO - __main__ - Step 1633: {'lr': 0.000408, 'samples': 313536, 'steps': 1632, 'loss/train': 2.9736287593841553}3989448547363} +11/06/2021 21:30:13 - INFO - __main__ - Step 1637: {'lr': 0.00040899999999999997, 'samples': 314304, 'steps': 1636, 'loss/train': 3.0355074405670166} +11/06/2021 21:30:15 - INFO - __main__ - Step 1642: {'lr': 0.00041025, 'samples': 315264, 'steps': 1641, 'loss/train': 2.085822105407715}074405670166} +11/06/2021 21:30:15 - INFO - __main__ - Step 1642: {'lr': 0.00041025, 'samples': 315264, 'steps': 1641, 'loss/train': 2.085822105407715}074405670166} +11/06/2021 21:30:19 - INFO - __main__ - Step 1649: {'lr': 0.000412, 'samples': 316608, 'steps': 1648, 'loss/train': 3.3871734142303467}}074405670166} +11/06/2021 21:30:21 - INFO - __main__ - Step 1653: {'lr': 0.000413, 'samples': 317376, 'steps': 1652, 'loss/train': 3.269364595413208}}}074405670166} +11/06/2021 21:30:24 - INFO - __main__ - Step 1659: {'lr': 0.0004145, 'samples': 318528, 'steps': 1658, 'loss/train': 3.018845558166504}}074405670166} +11/06/2021 21:30:24 - INFO - __main__ - Step 1659: {'lr': 0.0004145, 'samples': 318528, 'steps': 1658, 'loss/train': 3.018845558166504}}074405670166} +11/06/2021 21:30:27 - INFO - __main__ - Step 1665: {'lr': 0.000416, 'samples': 319680, 'steps': 1664, 'loss/train': 2.756814956665039}}}074405670166} +11/06/2021 21:30:29 - INFO - __main__ - Step 1669: {'lr': 0.000417, 'samples': 320448, 'steps': 1668, 'loss/train': 2.675729274749756}}}074405670166} +11/06/2021 21:30:31 - INFO - __main__ - Step 1674: {'lr': 0.00041825, 'samples': 321408, 'steps': 1673, 'loss/train': 3.209273338317871}074405670166} +11/06/2021 21:30:34 - INFO - __main__ - Step 1678: {'lr': 0.00041925, 'samples': 322176, 'steps': 1677, 'loss/train': 2.869393825531006}074405670166} +11/06/2021 21:30:36 - INFO - __main__ - Step 1682: {'lr': 0.00042025, 'samples': 322944, 'steps': 1681, 'loss/train': 2.867621421813965}074405670166} +11/06/2021 21:30:37 - INFO - __main__ - Step 1686: {'lr': 0.00042125, 'samples': 323712, 'steps': 1685, 'loss/train': 3.0616962909698486}74405670166} +11/06/2021 21:30:39 - INFO - __main__ - Step 1690: {'lr': 0.00042225000000000005, 'samples': 324480, 'steps': 1689, 'loss/train': 2.9707889556884766} +11/06/2021 21:30:39 - INFO - __main__ - Step 1690: {'lr': 0.00042225000000000005, 'samples': 324480, 'steps': 1689, 'loss/train': 2.9707889556884766} +11/06/2021 21:30:39 - INFO - __main__ - Step 1690: {'lr': 0.00042225000000000005, 'samples': 324480, 'steps': 1689, 'loss/train': 2.9707889556884766} +11/06/2021 21:30:45 - INFO - __main__ - Step 1702: {'lr': 0.00042525, 'samples': 326784, 'steps': 1701, 'loss/train': 2.888021469116211}889556884766} +11/06/2021 21:30:47 - INFO - __main__ - Step 1706: {'lr': 0.00042625000000000003, 'samples': 327552, 'steps': 1705, 'loss/train': 2.8724474906921387} +11/06/2021 21:30:50 - INFO - __main__ - Step 1711: {'lr': 0.0004275, 'samples': 328512, 'steps': 1710, 'loss/train': 3.4125115871429443}474906921387} +11/06/2021 21:30:52 - INFO - __main__ - Step 1715: {'lr': 0.0004285, 'samples': 329280, 'steps': 1714, 'loss/train': 3.073770046234131}}474906921387} +11/06/2021 21:30:54 - INFO - __main__ - Step 1719: {'lr': 0.0004295, 'samples': 330048, 'steps': 1718, 'loss/train': 3.0501821041107178}474906921387} +11/06/2021 21:30:55 - INFO - __main__ - Step 1723: {'lr': 0.0004305, 'samples': 330816, 'steps': 1722, 'loss/train': 2.9833667278289795}474906921387} +11/06/2021 21:30:57 - INFO - __main__ - Step 1727: {'lr': 0.0004315, 'samples': 331584, 'steps': 1726, 'loss/train': 2.6767044067382812}474906921387} +11/06/2021 21:31:00 - INFO - __main__ - Step 1732: {'lr': 0.00043275000000000003, 'samples': 332544, 'steps': 1731, 'loss/train': 3.1521098613739014} +11/06/2021 21:31:02 - INFO - __main__ - Step 1736: {'lr': 0.00043375000000000005, 'samples': 333312, 'steps': 1735, 'loss/train': 2.645113945007324}} +11/06/2021 21:31:04 - INFO - __main__ - Step 1740: {'lr': 0.00043475, 'samples': 334080, 'steps': 1739, 'loss/train': 2.9333367347717285}3945007324}} +11/06/2021 21:31:05 - INFO - __main__ - Step 1744: {'lr': 0.00043575000000000005, 'samples': 334848, 'steps': 1743, 'loss/train': 2.652301788330078}} +11/06/2021 21:31:07 - INFO - __main__ - Step 1748: {'lr': 0.00043675, 'samples': 335616, 'steps': 1747, 'loss/train': 2.979066848754883}01788330078}} +11/06/2021 21:31:10 - INFO - __main__ - Step 1753: {'lr': 0.000438, 'samples': 336576, 'steps': 1752, 'loss/train': 2.3090498447418213}}01788330078}} +11/06/2021 21:31:12 - INFO - __main__ - Step 1757: {'lr': 0.000439, 'samples': 337344, 'steps': 1756, 'loss/train': 3.583254337310791}}}01788330078}} +11/06/2021 21:31:14 - INFO - __main__ - Step 1761: {'lr': 0.00044, 'samples': 338112, 'steps': 1760, 'loss/train': 2.958988904953003}}}}01788330078}} +11/06/2021 21:31:16 - INFO - __main__ - Step 1765: {'lr': 0.000441, 'samples': 338880, 'steps': 1764, 'loss/train': 2.26016902923584}}}}01788330078}} +11/06/2021 21:31:17 - INFO - __main__ - Step 1769: {'lr': 0.000442, 'samples': 339648, 'steps': 1768, 'loss/train': 3.196798086166382}}}01788330078}} +11/06/2021 21:31:19 - INFO - __main__ - Step 1773: {'lr': 0.00044300000000000003, 'samples': 340416, 'steps': 1772, 'loss/train': 2.7474842071533203} +11/06/2021 21:31:22 - INFO - __main__ - Step 1778: {'lr': 0.00044425, 'samples': 341376, 'steps': 1777, 'loss/train': 1.8993228673934937}42071533203} +11/06/2021 21:31:24 - INFO - __main__ - Step 1782: {'lr': 0.00044525, 'samples': 342144, 'steps': 1781, 'loss/train': 3.134248971939087}}42071533203} +11/06/2021 21:31:26 - INFO - __main__ - Step 1786: {'lr': 0.00044625, 'samples': 342912, 'steps': 1785, 'loss/train': 1.7093374729156494}42071533203} +11/06/2021 21:31:27 - INFO - __main__ - Step 1790: {'lr': 0.00044725, 'samples': 343680, 'steps': 1789, 'loss/train': 2.685868263244629}}42071533203} +11/06/2021 21:31:29 - INFO - __main__ - Step 1794: {'lr': 0.00044824999999999997, 'samples': 344448, 'steps': 1793, 'loss/train': 2.5539019107818604} +11/06/2021 21:31:32 - INFO - __main__ - Step 1799: {'lr': 0.00044950000000000003, 'samples': 345408, 'steps': 1798, 'loss/train': 2.5512850284576416} +11/06/2021 21:31:34 - INFO - __main__ - Step 1803: {'lr': 0.0004505, 'samples': 346176, 'steps': 1802, 'loss/train': 3.1000237464904785}850284576416} +11/06/2021 21:31:36 - INFO - __main__ - Step 1807: {'lr': 0.0004515, 'samples': 346944, 'steps': 1806, 'loss/train': 2.2962563037872314}850284576416} +11/06/2021 21:31:36 - INFO - __main__ - Step 1807: {'lr': 0.0004515, 'samples': 346944, 'steps': 1806, 'loss/train': 2.2962563037872314}850284576416} +11/06/2021 21:31:39 - INFO - __main__ - Step 1814: {'lr': 0.00045325, 'samples': 348288, 'steps': 1813, 'loss/train': 3.2586300373077393}50284576416} +11/06/2021 21:31:42 - INFO - __main__ - Step 1820: {'lr': 0.00045475, 'samples': 349440, 'steps': 1819, 'loss/train': 2.775869846343994}}50284576416} +11/06/2021 21:31:42 - INFO - __main__ - Step 1820: {'lr': 0.00045475, 'samples': 349440, 'steps': 1819, 'loss/train': 2.775869846343994}}50284576416} +11/06/2021 21:31:45 - INFO - __main__ - Step 1827: {'lr': 0.00045650000000000004, 'samples': 350784, 'steps': 1826, 'loss/train': 2.706651210784912}} +11/06/2021 21:31:48 - INFO - __main__ - Step 1831: {'lr': 0.0004575, 'samples': 351552, 'steps': 1830, 'loss/train': 3.1444313526153564}51210784912}} +11/06/2021 21:31:48 - INFO - __main__ - Step 1831: {'lr': 0.0004575, 'samples': 351552, 'steps': 1830, 'loss/train': 3.1444313526153564}51210784912}} +11/06/2021 21:31:52 - INFO - __main__ - Step 1839: {'lr': 0.00045950000000000006, 'samples': 353088, 'steps': 1838, 'loss/train': 3.515568971633911}} +11/06/2021 21:31:53 - INFO - __main__ - Step 1843: {'lr': 0.0004605, 'samples': 353856, 'steps': 1842, 'loss/train': 2.9142487049102783}68971633911}} +11/06/2021 21:31:55 - INFO - __main__ - Step 1847: {'lr': 0.00046150000000000005, 'samples': 354624, 'steps': 1846, 'loss/train': 3.0182647705078125} +11/06/2021 21:31:58 - INFO - __main__ - Step 1852: {'lr': 0.00046275, 'samples': 355584, 'steps': 1851, 'loss/train': 2.291944980621338}647705078125} +11/06/2021 21:31:58 - INFO - __main__ - Step 1852: {'lr': 0.00046275, 'samples': 355584, 'steps': 1851, 'loss/train': 2.291944980621338}647705078125} +11/06/2021 21:31:58 - INFO - __main__ - Step 1852: {'lr': 0.00046275, 'samples': 355584, 'steps': 1851, 'loss/train': 2.291944980621338}647705078125} +11/06/2021 21:32:03 - INFO - __main__ - Step 1863: {'lr': 0.00046550000000000004, 'samples': 357696, 'steps': 1862, 'loss/train': 2.8213651180267334} +11/06/2021 21:32:05 - INFO - __main__ - Step 1868: {'lr': 0.00046675, 'samples': 358656, 'steps': 1867, 'loss/train': 2.391618013381958}651180267334} +11/06/2021 21:32:05 - INFO - __main__ - Step 1868: {'lr': 0.00046675, 'samples': 358656, 'steps': 1867, 'loss/train': 2.391618013381958}651180267334} +11/06/2021 21:32:05 - INFO - __main__ - Step 1868: {'lr': 0.00046675, 'samples': 358656, 'steps': 1867, 'loss/train': 2.391618013381958}651180267334} +11/06/2021 21:32:11 - INFO - __main__ - Step 1879: {'lr': 0.0004695, 'samples': 360768, 'steps': 1878, 'loss/train': 2.863210916519165}}651180267334} +11/06/2021 21:32:13 - INFO - __main__ - Step 1884: {'lr': 0.00047075000000000003, 'samples': 361728, 'steps': 1883, 'loss/train': 2.5549018383026123} +11/06/2021 21:32:13 - INFO - __main__ - Step 1884: {'lr': 0.00047075000000000003, 'samples': 361728, 'steps': 1883, 'loss/train': 2.5549018383026123} +11/06/2021 21:32:18 - INFO - __main__ - Step 1892: {'lr': 0.00047275, 'samples': 363264, 'steps': 1891, 'loss/train': 2.8816325664520264}18383026123} +11/06/2021 21:32:19 - INFO - __main__ - Step 1896: {'lr': 0.00047375, 'samples': 364032, 'steps': 1895, 'loss/train': 2.8144490718841553}18383026123} +11/06/2021 21:32:21 - INFO - __main__ - Step 1900: {'lr': 0.00047475, 'samples': 364800, 'steps': 1899, 'loss/train': 3.1232104301452637}18383026123} +11/06/2021 21:32:24 - INFO - __main__ - Step 1905: {'lr': 0.00047599999999999997, 'samples': 365760, 'steps': 1904, 'loss/train': 2.754312515258789}} +11/06/2021 21:32:26 - INFO - __main__ - Step 1909: {'lr': 0.000477, 'samples': 366528, 'steps': 1908, 'loss/train': 3.0879056453704834}312515258789}} +11/06/2021 21:32:26 - INFO - __main__ - Step 1909: {'lr': 0.000477, 'samples': 366528, 'steps': 1908, 'loss/train': 3.0879056453704834}312515258789}} +11/06/2021 21:32:30 - INFO - __main__ - Step 1917: {'lr': 0.000479, 'samples': 368064, 'steps': 1916, 'loss/train': 2.7934629917144775}312515258789}} +11/06/2021 21:32:31 - INFO - __main__ - Step 1921: {'lr': 0.00048, 'samples': 368832, 'steps': 1920, 'loss/train': 4.627929210662842}5}312515258789}} +11/06/2021 21:32:33 - INFO - __main__ - Step 1925: {'lr': 0.000481, 'samples': 369600, 'steps': 1924, 'loss/train': 2.7547266483306885}312515258789}} +11/06/2021 21:32:36 - INFO - __main__ - Step 1930: {'lr': 0.00048225000000000004, 'samples': 370560, 'steps': 1929, 'loss/train': 3.3702750205993652} +11/06/2021 21:32:38 - INFO - __main__ - Step 1934: {'lr': 0.00048325, 'samples': 371328, 'steps': 1933, 'loss/train': 1.854628324508667}750205993652} +11/06/2021 21:32:40 - INFO - __main__ - Step 1938: {'lr': 0.00048425000000000003, 'samples': 372096, 'steps': 1937, 'loss/train': 2.217445135116577}} +11/06/2021 21:32:41 - INFO - __main__ - Step 1942: {'lr': 0.00048525, 'samples': 372864, 'steps': 1941, 'loss/train': 2.725562334060669}45135116577}} +11/06/2021 21:32:43 - INFO - __main__ - Step 1946: {'lr': 0.00048625000000000003, 'samples': 373632, 'steps': 1945, 'loss/train': 2.831516981124878}} +11/06/2021 21:32:46 - INFO - __main__ - Step 1951: {'lr': 0.0004875, 'samples': 374592, 'steps': 1950, 'loss/train': 3.081878900527954}516981124878}} +11/06/2021 21:32:48 - INFO - __main__ - Step 1956: {'lr': 0.00048875, 'samples': 375552, 'steps': 1955, 'loss/train': 2.585529327392578}16981124878}} +11/06/2021 21:32:50 - INFO - __main__ - Step 1960: {'lr': 0.0004897500000000001, 'samples': 376320, 'steps': 1959, 'loss/train': 2.583451986312866}}} +11/06/2021 21:32:50 - INFO - __main__ - Step 1960: {'lr': 0.0004897500000000001, 'samples': 376320, 'steps': 1959, 'loss/train': 2.583451986312866}}} +11/06/2021 21:32:54 - INFO - __main__ - Step 1967: {'lr': 0.0004915, 'samples': 377664, 'steps': 1966, 'loss/train': 3.0170748233795166}1986312866}}} +11/06/2021 21:32:56 - INFO - __main__ - Step 1972: {'lr': 0.00049275, 'samples': 378624, 'steps': 1971, 'loss/train': 2.834716796875}66}1986312866}}} +11/06/2021 21:32:58 - INFO - __main__ - Step 1977: {'lr': 0.000494, 'samples': 379584, 'steps': 1976, 'loss/train': 2.7673490047454834}}1986312866}}} +11/06/2021 21:33:00 - INFO - __main__ - Step 1981: {'lr': 0.000495, 'samples': 380352, 'steps': 1980, 'loss/train': 2.695145845413208}}}1986312866}}} +11/06/2021 21:33:03 - INFO - __main__ - Step 1985: {'lr': 0.000496, 'samples': 381120, 'steps': 1984, 'loss/train': 2.6449930667877197}}1986312866}}} +11/06/2021 21:33:04 - INFO - __main__ - Step 1989: {'lr': 0.000497, 'samples': 381888, 'steps': 1988, 'loss/train': 2.3569090366363525}}1986312866}}} +11/06/2021 21:33:06 - INFO - __main__ - Step 1993: {'lr': 0.000498, 'samples': 382656, 'steps': 1992, 'loss/train': 2.463730573654175}}}1986312866}}} +11/06/2021 21:33:08 - INFO - __main__ - Step 1998: {'lr': 0.00049925, 'samples': 383616, 'steps': 1997, 'loss/train': 2.460160970687866}1986312866}}} +11/06/2021 21:33:10 - INFO - __main__ - Step 2002: {'lr': 0.0004999999999436769, 'samples': 384384, 'steps': 2001, 'loss/train': 2.369316816329956}}} +11/06/2021 21:33:13 - INFO - __main__ - Step 2006: {'lr': 0.0004999999985919232, 'samples': 385152, 'steps': 2005, 'loss/train': 2.7397634983062744}} +11/06/2021 21:33:14 - INFO - __main__ - Step 2010: {'lr': 0.0004999999954378312, 'samples': 385920, 'steps': 2009, 'loss/train': 2.108156681060791}}} +11/06/2021 21:33:16 - INFO - __main__ - Step 2014: {'lr': 0.000499999990481401, 'samples': 386688, 'steps': 2013, 'loss/train': 2.6608567237854004}}} +11/06/2021 21:33:18 - INFO - __main__ - Step 2018: {'lr': 0.0004999999837226326, 'samples': 387456, 'steps': 2017, 'loss/train': 2.4174294471740723}} +11/06/2021 21:33:20 - INFO - __main__ - Step 2022: {'lr': 0.0004999999751615261, 'samples': 388224, 'steps': 2021, 'loss/train': 2.4763200283050537}} +11/06/2021 21:33:22 - INFO - __main__ - Step 2026: {'lr': 0.0004999999647980814, 'samples': 388992, 'steps': 2025, 'loss/train': 2.2224512100219727}} +11/06/2021 21:33:24 - INFO - __main__ - Step 2030: {'lr': 0.0004999999526322987, 'samples': 389760, 'steps': 2029, 'loss/train': 2.9428741931915283}} +11/06/2021 21:33:26 - INFO - __main__ - Step 2035: {'lr': 0.0004999999348905326, 'samples': 390720, 'steps': 2034, 'loss/train': 2.2460341453552246}} +11/06/2021 21:33:28 - INFO - __main__ - Step 2039: {'lr': 0.0004999999186694897, 'samples': 391488, 'steps': 2038, 'loss/train': 2.7766733169555664}} +11/06/2021 21:33:30 - INFO - __main__ - Step 2043: {'lr': 0.0004999999006461091, 'samples': 392256, 'steps': 2042, 'loss/train': 2.7250239849090576}} +11/06/2021 21:33:30 - INFO - __main__ - Step 2043: {'lr': 0.0004999999006461091, 'samples': 392256, 'steps': 2042, 'loss/train': 2.7250239849090576}} +11/06/2021 21:33:34 - INFO - __main__ - Step 2050: {'lr': 0.0004999998647683184, 'samples': 393600, 'steps': 2049, 'loss/train': 2.4513065814971924}} +11/06/2021 21:33:36 - INFO - __main__ - Step 2056: {'lr': 0.0004999998296227291, 'samples': 394752, 'steps': 2055, 'loss/train': 2.863607168197632}}} +11/06/2021 21:33:36 - INFO - __main__ - Step 2056: {'lr': 0.0004999998296227291, 'samples': 394752, 'steps': 2055, 'loss/train': 2.863607168197632}}} +11/06/2021 21:33:40 - INFO - __main__ - Step 2063: {'lr': 0.0004999997834941459, 'samples': 396096, 'steps': 2062, 'loss/train': 3.102501153945923}}} +11/06/2021 21:33:42 - INFO - __main__ - Step 2067: {'lr': 0.0004999997546567423, 'samples': 396864, 'steps': 2066, 'loss/train': 2.925659418106079}}} +11/06/2021 21:33:44 - INFO - __main__ - Step 2072: {'lr': 0.0004999997160754522, 'samples': 397824, 'steps': 2071, 'loss/train': 2.0112996101379395}} +11/06/2021 21:33:46 - INFO - __main__ - Step 2076: {'lr': 0.0004999996831827918, 'samples': 398592, 'steps': 2075, 'loss/train': 2.0490965843200684}} +11/06/2021 21:33:48 - INFO - __main__ - Step 2080: {'lr': 0.0004999996484877955, 'samples': 399360, 'steps': 2079, 'loss/train': 2.834831953048706}}} +11/06/2021 21:33:50 - INFO - __main__ - Step 2084: {'lr': 0.0004999996119904633, 'samples': 400128, 'steps': 2083, 'loss/train': 2.5453062057495117}} +11/06/2021 21:33:52 - INFO - __main__ - Step 2088: {'lr': 0.0004999995736907957, 'samples': 400896, 'steps': 2087, 'loss/train': 2.4093174934387207}} +11/06/2021 21:33:54 - INFO - __main__ - Step 2093: {'lr': 0.0004999995232816774, 'samples': 401856, 'steps': 2092, 'loss/train': 2.0404558181762695}} +11/06/2021 21:33:57 - INFO - __main__ - Step 2098: {'lr': 0.0004999994700564109, 'samples': 402816, 'steps': 2097, 'loss/train': 2.6748390197753906}} +11/06/2021 21:33:57 - INFO - __main__ - Step 2098: {'lr': 0.0004999994700564109, 'samples': 402816, 'steps': 2097, 'loss/train': 2.6748390197753906}} +11/06/2021 21:34:00 - INFO - __main__ - Step 2105: {'lr': 0.00049999939080991, 'samples': 404160, 'steps': 2104, 'loss/train': 1.7636381387710571}6}} +11/06/2021 21:34:02 - INFO - __main__ - Step 2109: {'lr': 0.000499999343047986, 'samples': 404928, 'steps': 2108, 'loss/train': 2.693075180053711}6}} +11/06/2021 21:34:04 - INFO - __main__ - Step 2114: {'lr': 0.0004999992808110495, 'samples': 405888, 'steps': 2113, 'loss/train': 2.4178295135498047}} +11/06/2021 21:34:04 - INFO - __main__ - Step 2114: {'lr': 0.0004999992808110495, 'samples': 405888, 'steps': 2113, 'loss/train': 2.4178295135498047}} +11/06/2021 21:34:08 - INFO - __main__ - Step 2122: {'lr': 0.0004999991753743689, 'samples': 407424, 'steps': 2121, 'loss/train': 2.5452983379364014}} +11/06/2021 21:34:10 - INFO - __main__ - Step 2126: {'lr': 0.0004999991199525299, 'samples': 408192, 'steps': 2125, 'loss/train': 2.357633113861084}}} +11/06/2021 21:34:12 - INFO - __main__ - Step 2130: {'lr': 0.000499999062728359, 'samples': 408960, 'steps': 2129, 'loss/train': 2.727692127227783}}}} +11/06/2021 21:34:14 - INFO - __main__ - Step 2135: {'lr': 0.0004999989886636166, 'samples': 409920, 'steps': 2134, 'loss/train': 2.996830463409424}}} +11/06/2021 21:34:14 - INFO - __main__ - Step 2135: {'lr': 0.0004999989886636166, 'samples': 409920, 'steps': 2134, 'loss/train': 2.996830463409424}}} +11/06/2021 21:34:18 - INFO - __main__ - Step 2142: {'lr': 0.0004999988802418587, 'samples': 411264, 'steps': 2141, 'loss/train': 2.5951883792877197}} +11/06/2021 21:34:20 - INFO - __main__ - Step 2146: {'lr': 0.0004999988158083643, 'samples': 412032, 'steps': 2145, 'loss/train': 2.607226848602295}}} +11/06/2021 21:34:22 - INFO - __main__ - Step 2151: {'lr': 0.0004999987327319701, 'samples': 412992, 'steps': 2150, 'loss/train': 2.9837472438812256}} +11/06/2021 21:34:25 - INFO - __main__ - Step 2156: {'lr': 0.0004999986468394367, 'samples': 413952, 'steps': 2155, 'loss/train': 2.50052547454834}6}} +11/06/2021 21:34:27 - INFO - __main__ - Step 2160: {'lr': 0.0004999985760977903, 'samples': 414720, 'steps': 2159, 'loss/train': 2.2128641605377197}} +11/06/2021 21:34:27 - INFO - __main__ - Step 2160: {'lr': 0.0004999985760977903, 'samples': 414720, 'steps': 2159, 'loss/train': 2.2128641605377197}} +11/06/2021 21:34:30 - INFO - __main__ - Step 2167: {'lr': 0.0004999984479630577, 'samples': 416064, 'steps': 2166, 'loss/train': 2.6970345973968506}} +11/06/2021 21:34:32 - INFO - __main__ - Step 2172: {'lr': 0.0004999983530588853, 'samples': 417024, 'steps': 2171, 'loss/train': 2.061142921447754}}} +11/06/2021 21:34:35 - INFO - __main__ - Step 2177: {'lr': 0.0004999982553385778, 'samples': 417984, 'steps': 2176, 'loss/train': 2.5779266357421875}} +11/06/2021 21:34:35 - INFO - __main__ - Step 2177: {'lr': 0.0004999982553385778, 'samples': 417984, 'steps': 2176, 'loss/train': 2.5779266357421875}} +11/06/2021 21:34:38 - INFO - __main__ - Step 2184: {'lr': 0.0004999981137990425, 'samples': 419328, 'steps': 2183, 'loss/train': 3.1171112060546875}} +11/06/2021 21:34:40 - INFO - __main__ - Step 2188: {'lr': 0.0004999980304411116, 'samples': 420096, 'steps': 2187, 'loss/train': 2.344801902770996}}} +11/06/2021 21:34:43 - INFO - __main__ - Step 2194: {'lr': 0.0004999979020248577, 'samples': 421248, 'steps': 2193, 'loss/train': 2.4983091354370117}} +11/06/2021 21:34:43 - INFO - __main__ - Step 2194: {'lr': 0.0004999979020248577, 'samples': 421248, 'steps': 2193, 'loss/train': 2.4983091354370117}} +11/06/2021 21:34:47 - INFO - __main__ - Step 2201: {'lr': 0.0004999977470805383, 'samples': 422592, 'steps': 2200, 'loss/train': 2.3798577785491943}} +11/06/2021 21:34:48 - INFO - __main__ - Step 2205: {'lr': 0.0004999976560627344, 'samples': 423360, 'steps': 2204, 'loss/train': 2.8710994720458984}} +11/06/2021 21:34:50 - INFO - __main__ - Step 2209: {'lr': 0.000499997563242609, 'samples': 424128, 'steps': 2208, 'loss/train': 2.5492539405822754}}} +11/06/2021 21:34:53 - INFO - __main__ - Step 2214: {'lr': 0.0004999974446829389, 'samples': 425088, 'steps': 2213, 'loss/train': 2.4633007049560547}} +11/06/2021 21:34:55 - INFO - __main__ - Step 2218: {'lr': 0.0004999973478075928, 'samples': 425856, 'steps': 2217, 'loss/train': 2.6798555850982666}} +11/06/2021 21:34:57 - INFO - __main__ - Step 2222: {'lr': 0.0004999972491299276, 'samples': 426624, 'steps': 2221, 'loss/train': 2.5645909309387207}} +11/06/2021 21:34:58 - INFO - __main__ - Step 2226: {'lr': 0.000499997148649944, 'samples': 427392, 'steps': 2225, 'loss/train': 2.6324121952056885}}} +11/06/2021 21:35:00 - INFO - __main__ - Step 2230: {'lr': 0.0004999970463676427, 'samples': 428160, 'steps': 2229, 'loss/train': 2.492368221282959}}} +11/06/2021 21:35:03 - INFO - __main__ - Step 2235: {'lr': 0.0004999969159802577, 'samples': 429120, 'steps': 2234, 'loss/train': 2.6638810634613037}} +11/06/2021 21:35:05 - INFO - __main__ - Step 2239: {'lr': 0.0004999968096427443, 'samples': 429888, 'steps': 2238, 'loss/train': 1.956204891204834}}} +11/06/2021 21:35:07 - INFO - __main__ - Step 2243: {'lr': 0.0004999967015029155, 'samples': 430656, 'steps': 2242, 'loss/train': 2.4464919567108154}} +11/06/2021 21:35:08 - INFO - __main__ - Step 2247: {'lr': 0.0004999965915607722, 'samples': 431424, 'steps': 2246, 'loss/train': 1.3028373718261719}} +11/06/2021 21:35:10 - INFO - __main__ - Step 2251: {'lr': 0.0004999964798163152, 'samples': 432192, 'steps': 2250, 'loss/train': 2.384847640991211}}} +11/06/2021 21:35:13 - INFO - __main__ - Step 2256: {'lr': 0.0004999963376012416, 'samples': 433152, 'steps': 2255, 'loss/train': 2.2551157474517822}} +11/06/2021 21:35:13 - INFO - __main__ - Step 2256: {'lr': 0.0004999963376012416, 'samples': 433152, 'steps': 2255, 'loss/train': 2.2551157474517822}} +11/06/2021 21:35:17 - INFO - __main__ - Step 2264: {'lr': 0.0004999961041996109, 'samples': 434688, 'steps': 2263, 'loss/train': 2.3833937644958496}} +11/06/2021 21:35:18 - INFO - __main__ - Step 2268: {'lr': 0.0004999959847953299, 'samples': 435456, 'steps': 2267, 'loss/train': 1.9739242792129517}} +11/06/2021 21:35:20 - INFO - __main__ - Step 2272: {'lr': 0.0004999958635887394, 'samples': 436224, 'steps': 2271, 'loss/train': 2.7278921604156494}} +11/06/2021 21:35:23 - INFO - __main__ - Step 2278: {'lr': 0.0004999956783995257, 'samples': 437376, 'steps': 2277, 'loss/train': 2.585498809814453}}} +11/06/2021 21:35:25 - INFO - __main__ - Step 2282: {'lr': 0.0004999955526871659, 'samples': 438144, 'steps': 2281, 'loss/train': 1.7193819284439087}} +11/06/2021 21:35:27 - INFO - __main__ - Step 2286: {'lr': 0.0004999954251724999, 'samples': 438912, 'steps': 2285, 'loss/train': 2.635653495788574}}} +11/06/2021 21:35:27 - INFO - __main__ - Step 2286: {'lr': 0.0004999954251724999, 'samples': 438912, 'steps': 2285, 'loss/train': 2.635653495788574}}} +11/06/2021 21:35:31 - INFO - __main__ - Step 2293: {'lr': 0.0004999951976850377, 'samples': 440256, 'steps': 2292, 'loss/train': 1.871019721031189}}} +11/06/2021 21:35:33 - INFO - __main__ - Step 2298: {'lr': 0.0004999950318146737, 'samples': 441216, 'steps': 2297, 'loss/train': 2.5910117626190186}} +11/06/2021 21:35:35 - INFO - __main__ - Step 2302: {'lr': 0.0004999948970907921, 'samples': 441984, 'steps': 2301, 'loss/train': 2.345691442489624}}} +11/06/2021 21:35:35 - INFO - __main__ - Step 2302: {'lr': 0.0004999948970907921, 'samples': 441984, 'steps': 2301, 'loss/train': 2.345691442489624}}} +11/06/2021 21:35:38 - INFO - __main__ - Step 2309: {'lr': 0.0004999946569872118, 'samples': 443328, 'steps': 2308, 'loss/train': 2.174234628677368}}} +11/06/2021 21:35:41 - INFO - __main__ - Step 2314: {'lr': 0.0004999944821053422, 'samples': 444288, 'steps': 2313, 'loss/train': 2.653313636779785}}} +11/06/2021 21:35:43 - INFO - __main__ - Step 2319: {'lr': 0.0004999943044073813, 'samples': 445248, 'steps': 2318, 'loss/train': 2.925724983215332}}} +11/06/2021 21:35:45 - INFO - __main__ - Step 2323: {'lr': 0.000499994160221428, 'samples': 446016, 'steps': 2322, 'loss/train': 2.5466785430908203}}} +11/06/2021 21:35:45 - INFO - __main__ - Step 2323: {'lr': 0.000499994160221428, 'samples': 446016, 'steps': 2322, 'loss/train': 2.5466785430908203}}} +11/06/2021 21:35:49 - INFO - __main__ - Step 2330: {'lr': 0.0004999939035592351, 'samples': 447360, 'steps': 2329, 'loss/train': 1.2856340408325195}} +11/06/2021 21:35:51 - INFO - __main__ - Step 2335: {'lr': 0.0004999937168497954, 'samples': 448320, 'steps': 2334, 'loss/train': 2.982269763946533}}} +11/06/2021 21:35:53 - INFO - __main__ - Step 2339: {'lr': 0.0004999935654546638, 'samples': 449088, 'steps': 2338, 'loss/train': 2.4741744995117188}} +11/06/2021 21:35:53 - INFO - __main__ - Step 2339: {'lr': 0.0004999935654546638, 'samples': 449088, 'steps': 2338, 'loss/train': 2.4741744995117188}} +11/06/2021 21:35:57 - INFO - __main__ - Step 2346: {'lr': 0.0004999932961764192, 'samples': 450432, 'steps': 2345, 'loss/train': 2.2040252685546875}} +11/06/2021 21:35:59 - INFO - __main__ - Step 2350: {'lr': 0.0004999931398249876, 'samples': 451200, 'steps': 2349, 'loss/train': 1.3503772020339966}} +11/06/2021 21:36:01 - INFO - __main__ - Step 2355: {'lr': 0.0004999929418512296, 'samples': 452160, 'steps': 2354, 'loss/train': 2.645233392715454}}} +11/06/2021 21:36:03 - INFO - __main__ - Step 2359: {'lr': 0.0004999927814446498, 'samples': 452928, 'steps': 2358, 'loss/train': 2.382434844970703}}} +11/06/2021 21:36:05 - INFO - __main__ - Step 2363: {'lr': 0.0004999926192357836, 'samples': 453696, 'steps': 2362, 'loss/train': 2.667649269104004}}} +11/06/2021 21:36:07 - INFO - __main__ - Step 2367: {'lr': 0.0004999924552246324, 'samples': 454464, 'steps': 2366, 'loss/train': 2.5451650619506836}} +11/06/2021 21:36:09 - INFO - __main__ - Step 2371: {'lr': 0.0004999922894111975, 'samples': 455232, 'steps': 2370, 'loss/train': 2.5309088230133057}} +11/06/2021 21:36:11 - INFO - __main__ - Step 2376: {'lr': 0.0004999920796099437, 'samples': 456192, 'steps': 2375, 'loss/train': 2.113866090774536}}} +11/06/2021 21:36:13 - INFO - __main__ - Step 2380: {'lr': 0.0004999919097413743, 'samples': 456960, 'steps': 2379, 'loss/train': 2.0128252506256104}} +11/06/2021 21:36:16 - INFO - __main__ - Step 2384: {'lr': 0.000499991738070525, 'samples': 457728, 'steps': 2383, 'loss/train': 2.820688247680664}4}} +11/06/2021 21:36:17 - INFO - __main__ - Step 2388: {'lr': 0.000499991564597397, 'samples': 458496, 'steps': 2387, 'loss/train': 2.985884189605713}4}} +11/06/2021 21:36:19 - INFO - __main__ - Step 2392: {'lr': 0.0004999913893219915, 'samples': 459264, 'steps': 2391, 'loss/train': 2.4803824424743652}} +11/06/2021 21:36:22 - INFO - __main__ - Step 2397: {'lr': 0.0004999911676932838, 'samples': 460224, 'steps': 2396, 'loss/train': 2.7710964679718018}} +11/06/2021 21:36:24 - INFO - __main__ - Step 2401: {'lr': 0.0004999909883627587, 'samples': 460992, 'steps': 2400, 'loss/train': 2.3043596744537354}} +11/06/2021 21:36:26 - INFO - __main__ - Step 2405: {'lr': 0.0004999908072299602, 'samples': 461760, 'steps': 2404, 'loss/train': 2.4561195373535156}} +11/06/2021 21:36:26 - INFO - __main__ - Step 2405: {'lr': 0.0004999908072299602, 'samples': 461760, 'steps': 2404, 'loss/train': 2.4561195373535156}} +11/06/2021 21:36:29 - INFO - __main__ - Step 2412: {'lr': 0.0004999904859108467, 'samples': 463104, 'steps': 2411, 'loss/train': 2.3780782222747803}} +11/06/2021 21:36:31 - INFO - __main__ - Step 2417: {'lr': 0.000499990253017938, 'samples': 464064, 'steps': 2416, 'loss/train': 2.537015438079834}3}} +11/06/2021 21:36:31 - INFO - __main__ - Step 2417: {'lr': 0.000499990253017938, 'samples': 464064, 'steps': 2416, 'loss/train': 2.537015438079834}3}} +11/06/2021 21:36:35 - INFO - __main__ - Step 2425: {'lr': 0.0004999898745319145, 'samples': 465600, 'steps': 2424, 'loss/train': 2.419081449508667}}} +11/06/2021 21:36:37 - INFO - __main__ - Step 2429: {'lr': 0.000499989682585504, 'samples': 466368, 'steps': 2428, 'loss/train': 1.5299700498580933}}} +11/06/2021 21:36:39 - INFO - __main__ - Step 2434: {'lr': 0.0004999894401180576, 'samples': 467328, 'steps': 2433, 'loss/train': 2.631399631500244}}} +11/06/2021 21:36:39 - INFO - __main__ - Step 2434: {'lr': 0.0004999894401180576, 'samples': 467328, 'steps': 2433, 'loss/train': 2.631399631500244}}} +11/06/2021 21:36:44 - INFO - __main__ - Step 2442: {'lr': 0.0004999890463127924, 'samples': 468864, 'steps': 2441, 'loss/train': 2.5758795738220215}} +11/06/2021 21:36:45 - INFO - __main__ - Step 2446: {'lr': 0.0004999888467067702, 'samples': 469632, 'steps': 2445, 'loss/train': 2.458528757095337}}} +11/06/2021 21:36:47 - INFO - __main__ - Step 2450: {'lr': 0.00049998864529849, 'samples': 470400, 'steps': 2449, 'loss/train': 1.814773440361023}7}}} +11/06/2021 21:36:49 - INFO - __main__ - Step 2454: {'lr': 0.0004999884420879534, 'samples': 471168, 'steps': 2453, 'loss/train': 2.2643680572509766}} +11/06/2021 21:36:49 - INFO - __main__ - Step 2454: {'lr': 0.0004999884420879534, 'samples': 471168, 'steps': 2453, 'loss/train': 2.2643680572509766}} +11/06/2021 21:36:53 - INFO - __main__ - Step 2461: {'lr': 0.0004999880821328395, 'samples': 472512, 'steps': 2460, 'loss/train': 2.13460373878479}6}} +11/06/2021 21:36:55 - INFO - __main__ - Step 2466: {'lr': 0.0004999878216428201, 'samples': 473472, 'steps': 2465, 'loss/train': 3.099053144454956}}} +11/06/2021 21:36:57 - INFO - __main__ - Step 2470: {'lr': 0.0004999876112232726, 'samples': 474240, 'steps': 2469, 'loss/train': 2.2806897163391113}} +11/06/2021 21:36:59 - INFO - __main__ - Step 2474: {'lr': 0.0004999873990014763, 'samples': 475008, 'steps': 2473, 'loss/train': 2.296961784362793}}} +11/06/2021 21:36:59 - INFO - __main__ - Step 2474: {'lr': 0.0004999873990014763, 'samples': 475008, 'steps': 2473, 'loss/train': 2.296961784362793}}} +11/06/2021 21:37:03 - INFO - __main__ - Step 2481: {'lr': 0.0004999870232766756, 'samples': 476352, 'steps': 2480, 'loss/train': 2.6014020442962646}} +11/06/2021 21:37:05 - INFO - __main__ - Step 2486: {'lr': 0.0004999867515226088, 'samples': 477312, 'steps': 2485, 'loss/train': 2.565920829772949}}} +11/06/2021 21:37:05 - INFO - __main__ - Step 2486: {'lr': 0.0004999867515226088, 'samples': 477312, 'steps': 2485, 'loss/train': 2.565920829772949}}} +11/06/2021 21:37:09 - INFO - __main__ - Step 2494: {'lr': 0.000499986310858814, 'samples': 478848, 'steps': 2493, 'loss/train': 2.30643892288208}9}}} +11/06/2021 21:37:11 - INFO - __main__ - Step 2498: {'lr': 0.0004999860878235564, 'samples': 479616, 'steps': 2497, 'loss/train': 2.4118523597717285}} +11/06/2021 21:37:13 - INFO - __main__ - Step 2502: {'lr': 0.0004999858629860609, 'samples': 480384, 'steps': 2501, 'loss/train': 2.3400754928588867}} +11/06/2021 21:37:15 - INFO - __main__ - Step 2506: {'lr': 0.000499985636346329, 'samples': 481152, 'steps': 2505, 'loss/train': 2.2163236141204834}}} +11/06/2021 21:37:17 - INFO - __main__ - Step 2511: {'lr': 0.0004999853505122718, 'samples': 482112, 'steps': 2510, 'loss/train': 2.314603567123413}}} +11/06/2021 21:37:19 - INFO - __main__ - Step 2515: {'lr': 0.0004999851198175141, 'samples': 482880, 'steps': 2514, 'loss/train': 2.3666229248046875}} +11/06/2021 21:37:19 - INFO - __main__ - Step 2515: {'lr': 0.0004999851198175141, 'samples': 482880, 'steps': 2514, 'loss/train': 2.3666229248046875}} +11/06/2021 21:37:23 - INFO - __main__ - Step 2522: {'lr': 0.0004999847117650708, 'samples': 484224, 'steps': 2521, 'loss/train': 2.2497646808624268}} +11/06/2021 21:37:25 - INFO - __main__ - Step 2527: {'lr': 0.0004999844169198617, 'samples': 485184, 'steps': 2526, 'loss/train': 2.444234609603882}}} +11/06/2021 21:37:28 - INFO - __main__ - Step 2532: {'lr': 0.0004999841192586746, 'samples': 486144, 'steps': 2531, 'loss/train': 2.247392177581787}}} +11/06/2021 21:37:28 - INFO - __main__ - Step 2532: {'lr': 0.0004999841192586746, 'samples': 486144, 'steps': 2531, 'loss/train': 2.247392177581787}}} +11/06/2021 21:37:31 - INFO - __main__ - Step 2539: {'lr': 0.000499983697802176, 'samples': 487488, 'steps': 2538, 'loss/train': 2.763502836227417}}}} +11/06/2021 21:37:33 - INFO - __main__ - Step 2543: {'lr': 0.0004999834544918369, 'samples': 488256, 'steps': 2542, 'loss/train': 1.3541216850280762}} +11/06/2021 21:37:35 - INFO - __main__ - Step 2548: {'lr': 0.0004999831478195429, 'samples': 489216, 'steps': 2547, 'loss/train': 2.1510307788848877}} +11/06/2021 21:37:38 - INFO - __main__ - Step 2553: {'lr': 0.0004999828383312851, 'samples': 490176, 'steps': 2552, 'loss/train': 2.293485403060913}}} +11/06/2021 21:37:40 - INFO - __main__ - Step 2557: {'lr': 0.0004999825887131874, 'samples': 490944, 'steps': 2556, 'loss/train': 2.3221940994262695}} +11/06/2021 21:37:42 - INFO - __main__ - Step 2561: {'lr': 0.000499982337292877, 'samples': 491712, 'steps': 2560, 'loss/train': 2.518115758895874}5}} +11/06/2021 21:37:44 - INFO - __main__ - Step 2565: {'lr': 0.0004999820840703554, 'samples': 492480, 'steps': 2564, 'loss/train': 2.438570022583008}}} +11/06/2021 21:37:45 - INFO - __main__ - Step 2569: {'lr': 0.0004999818290456249, 'samples': 493248, 'steps': 2568, 'loss/train': 2.5977227687835693}} +11/06/2021 21:37:48 - INFO - __main__ - Step 2574: {'lr': 0.0004999815077303579, 'samples': 494208, 'steps': 2573, 'loss/train': 2.548187017440796}}} +11/06/2021 21:37:50 - INFO - __main__ - Step 2578: {'lr': 0.0004999812486506637, 'samples': 494976, 'steps': 2577, 'loss/train': 1.985874056816101}}} +11/06/2021 21:37:52 - INFO - __main__ - Step 2582: {'lr': 0.0004999809877687662, 'samples': 495744, 'steps': 2581, 'loss/train': 2.4952125549316406}} +11/06/2021 21:37:54 - INFO - __main__ - Step 2586: {'lr': 0.0004999807250846676, 'samples': 496512, 'steps': 2585, 'loss/train': 2.023077964782715}}} +11/06/2021 21:37:55 - INFO - __main__ - Step 2590: {'lr': 0.0004999804605983697, 'samples': 497280, 'steps': 2589, 'loss/train': 1.7954328060150146}} +11/06/2021 21:37:57 - INFO - __main__ - Step 2594: {'lr': 0.0004999801943098743, 'samples': 498048, 'steps': 2593, 'loss/train': 2.145956039428711}}} +11/06/2021 21:38:00 - INFO - __main__ - Step 2599: {'lr': 0.0004999798589149179, 'samples': 499008, 'steps': 2598, 'loss/train': 1.718825101852417}}} +11/06/2021 21:38:00 - INFO - __main__ - Step 2599: {'lr': 0.0004999798589149179, 'samples': 499008, 'steps': 2598, 'loss/train': 1.718825101852417}}} +11/06/2021 21:38:03 - INFO - __main__ - Step 2606: {'lr': 0.000499979384631223, 'samples': 500352, 'steps': 2605, 'loss/train': 2.426281690597534}}}} +11/06/2021 21:38:05 - INFO - __main__ - Step 2611: {'lr': 0.0004999790424780492, 'samples': 501312, 'steps': 2610, 'loss/train': 2.595461368560791}}} +11/06/2021 21:38:08 - INFO - __main__ - Step 2616: {'lr': 0.0004999786975089577, 'samples': 502272, 'steps': 2615, 'loss/train': 4.580399513244629}}} +11/06/2021 21:38:08 - INFO - __main__ - Step 2616: {'lr': 0.0004999786975089577, 'samples': 502272, 'steps': 2615, 'loss/train': 4.580399513244629}}} +11/06/2021 21:38:11 - INFO - __main__ - Step 2623: {'lr': 0.0004999782098214957, 'samples': 503616, 'steps': 2622, 'loss/train': 2.4918506145477295}} +11/06/2021 21:38:13 - INFO - __main__ - Step 2627: {'lr': 0.0004999779286649461, 'samples': 504384, 'steps': 2626, 'loss/train': 2.620913028717041}}} +11/06/2021 21:38:16 - INFO - __main__ - Step 2632: {'lr': 0.0004999775746849451, 'samples': 505344, 'steps': 2631, 'loss/train': 1.9219590425491333}} +11/06/2021 21:38:18 - INFO - __main__ - Step 2636: {'lr': 0.0004999772894734954, 'samples': 506112, 'steps': 2635, 'loss/train': 1.6440210342407227}} +11/06/2021 21:38:20 - INFO - __main__ - Step 2640: {'lr': 0.0004999770024598711, 'samples': 506880, 'steps': 2639, 'loss/train': 2.848144054412842}}} +11/06/2021 21:38:22 - INFO - __main__ - Step 2644: {'lr': 0.0004999767136440742, 'samples': 507648, 'steps': 2643, 'loss/train': 2.4299545288085938}} +11/06/2021 21:38:23 - INFO - __main__ - Step 2648: {'lr': 0.0004999764230261072, 'samples': 508416, 'steps': 2647, 'loss/train': 2.69739031791687}8}} +11/06/2021 21:38:26 - INFO - __main__ - Step 2653: {'lr': 0.0004999760572193492, 'samples': 509376, 'steps': 2652, 'loss/train': 2.0966432094573975}} +11/06/2021 21:38:28 - INFO - __main__ - Step 2657: {'lr': 0.0004999757625465063, 'samples': 510144, 'steps': 2656, 'loss/train': 1.6061630249023438}} +11/06/2021 21:38:30 - INFO - __main__ - Step 2661: {'lr': 0.0004999754660714999, 'samples': 510912, 'steps': 2660, 'loss/train': 2.1438426971435547}} +11/06/2021 21:38:32 - INFO - __main__ - Step 2665: {'lr': 0.0004999751677943322, 'samples': 511680, 'steps': 2664, 'loss/train': 1.7713021039962769}} +11/06/2021 21:38:33 - INFO - __main__ - Step 2669: {'lr': 0.0004999748677150051, 'samples': 512448, 'steps': 2668, 'loss/train': 2.6738812923431396}} +11/06/2021 21:38:35 - INFO - __main__ - Step 2673: {'lr': 0.0004999745658335209, 'samples': 513216, 'steps': 2672, 'loss/train': 2.6007511615753174}} +11/06/2021 21:38:38 - INFO - __main__ - Step 2678: {'lr': 0.0004999741859473857, 'samples': 514176, 'steps': 2677, 'loss/train': 2.3065757751464844}} +11/06/2021 21:38:38 - INFO - __main__ - Step 2678: {'lr': 0.0004999741859473857, 'samples': 514176, 'steps': 2677, 'loss/train': 2.3065757751464844}} +11/06/2021 21:38:41 - INFO - __main__ - Step 2685: {'lr': 0.0004999736493761477, 'samples': 515520, 'steps': 2684, 'loss/train': 2.4622879028320312}} +11/06/2021 21:38:43 - INFO - __main__ - Step 2689: {'lr': 0.0004999733402860572, 'samples': 516288, 'steps': 2688, 'loss/train': 2.6095635890960693}} +11/06/2021 21:38:46 - INFO - __main__ - Step 2694: {'lr': 0.0004999729513891762, 'samples': 517248, 'steps': 2693, 'loss/train': 2.7909016609191895}} +11/06/2021 21:38:48 - INFO - __main__ - Step 2698: {'lr': 0.0004999726382442601, 'samples': 518016, 'steps': 2697, 'loss/train': 1.9356613159179688}} +11/06/2021 21:38:48 - INFO - __main__ - Step 2698: {'lr': 0.0004999726382442601, 'samples': 518016, 'steps': 2697, 'loss/train': 1.9356613159179688}} +11/06/2021 21:38:52 - INFO - __main__ - Step 2705: {'lr': 0.0004999720859042565, 'samples': 519360, 'steps': 2704, 'loss/train': 2.2500193119049072}} +11/06/2021 21:38:54 - INFO - __main__ - Step 2710: {'lr': 0.0004999716879966747, 'samples': 520320, 'steps': 2709, 'loss/train': 2.6745805740356445}} +11/06/2021 21:38:56 - INFO - __main__ - Step 2714: {'lr': 0.0004999713676432082, 'samples': 521088, 'steps': 2713, 'loss/train': 2.1871511936187744}} +11/06/2021 21:38:57 - INFO - __main__ - Step 2718: {'lr': 0.0004999710454876099, 'samples': 521856, 'steps': 2717, 'loss/train': 2.10378360748291}4}} +11/06/2021 21:39:00 - INFO - __main__ - Step 2722: {'lr': 0.000499970721529882, 'samples': 522624, 'steps': 2721, 'loss/train': 3.079136848449707}4}} +11/06/2021 21:39:02 - INFO - __main__ - Step 2727: {'lr': 0.000499970314048481, 'samples': 523584, 'steps': 2726, 'loss/train': 2.2870664596557617}}} +11/06/2021 21:39:04 - INFO - __main__ - Step 2731: {'lr': 0.0004999699860359702, 'samples': 524352, 'steps': 2730, 'loss/train': 2.656719446182251}}} +11/06/2021 21:39:06 - INFO - __main__ - Step 2735: {'lr': 0.0004999696562213375, 'samples': 525120, 'steps': 2734, 'loss/train': 2.221712827682495}}} +11/06/2021 21:39:08 - INFO - __main__ - Step 2739: {'lr': 0.0004999693246045854, 'samples': 525888, 'steps': 2738, 'loss/train': 2.2682254314422607}} +11/06/2021 21:39:09 - INFO - __main__ - Step 2743: {'lr': 0.000499968991185716, 'samples': 526656, 'steps': 2742, 'loss/train': 2.7001304626464844}}} +11/06/2021 21:39:11 - INFO - __main__ - Step 2747: {'lr': 0.0004999686559647319, 'samples': 527424, 'steps': 2746, 'loss/train': 2.5279910564422607}} +11/06/2021 21:39:11 - INFO - __main__ - Step 2747: {'lr': 0.0004999686559647319, 'samples': 527424, 'steps': 2746, 'loss/train': 2.5279910564422607}} +11/06/2021 21:39:11 - INFO - __main__ - Step 2747: {'lr': 0.0004999686559647319, 'samples': 527424, 'steps': 2746, 'loss/train': 2.5279910564422607}} +11/06/2021 21:39:17 - INFO - __main__ - Step 2758: {'lr': 0.0004999677248148916, 'samples': 529536, 'steps': 2757, 'loss/train': 2.4732248783111572}} +11/06/2021 21:39:20 - INFO - __main__ - Step 2764: {'lr': 0.0004999672111707639, 'samples': 530688, 'steps': 2763, 'loss/train': 3.058380603790283}}} +11/06/2021 21:39:22 - INFO - __main__ - Step 2768: {'lr': 0.0004999668664887175, 'samples': 531456, 'steps': 2767, 'loss/train': 2.2657551765441895}} +11/06/2021 21:39:24 - INFO - __main__ - Step 2772: {'lr': 0.0004999665200045716, 'samples': 532224, 'steps': 2771, 'loss/train': 1.0660734176635742}} +11/06/2021 21:39:26 - INFO - __main__ - Step 2776: {'lr': 0.000499966171718329, 'samples': 532992, 'steps': 2775, 'loss/train': 2.4398868083953857}}} +11/06/2021 21:39:28 - INFO - __main__ - Step 2780: {'lr': 0.0004999658216299919, 'samples': 533760, 'steps': 2779, 'loss/train': 2.217278242111206}}} +11/06/2021 21:39:30 - INFO - __main__ - Step 2785: {'lr': 0.0004999653814853791, 'samples': 534720, 'steps': 2784, 'loss/train': 2.1000912189483643}} +11/06/2021 21:39:32 - INFO - __main__ - Step 2789: {'lr': 0.0004999650273423389, 'samples': 535488, 'steps': 2788, 'loss/train': 2.207897663116455}}} +11/06/2021 21:39:32 - INFO - __main__ - Step 2789: {'lr': 0.0004999650273423389, 'samples': 535488, 'steps': 2788, 'loss/train': 2.207897663116455}}} +11/06/2021 21:39:35 - INFO - __main__ - Step 2795: {'lr': 0.0004999644927488678, 'samples': 536640, 'steps': 2794, 'loss/train': 2.290945529937744}}} +11/06/2021 21:39:38 - INFO - __main__ - Step 2800: {'lr': 0.0004999640441569793, 'samples': 537600, 'steps': 2799, 'loss/train': 1.9303408861160278}} +11/06/2021 21:39:40 - INFO - __main__ - Step 2805: {'lr': 0.0004999635927493423, 'samples': 538560, 'steps': 2804, 'loss/train': 2.4244282245635986}} +11/06/2021 21:39:40 - INFO - __main__ - Step 2805: {'lr': 0.0004999635927493423, 'samples': 538560, 'steps': 2804, 'loss/train': 2.4244282245635986}} +11/06/2021 21:39:44 - INFO - __main__ - Step 2812: {'lr': 0.0004999629560482026, 'samples': 539904, 'steps': 2811, 'loss/train': 1.2682995796203613}} +11/06/2021 21:39:46 - INFO - __main__ - Step 2816: {'lr': 0.0004999625897411311, 'samples': 540672, 'steps': 2815, 'loss/train': 2.5656561851501465}} +11/06/2021 21:39:48 - INFO - __main__ - Step 2821: {'lr': 0.0004999621293231331, 'samples': 541632, 'steps': 2820, 'loss/train': 2.8650639057159424}} +11/06/2021 21:39:50 - INFO - __main__ - Step 2825: {'lr': 0.000499961758961411, 'samples': 542400, 'steps': 2824, 'loss/train': 2.4017333984375}424}} +11/06/2021 21:39:52 - INFO - __main__ - Step 2829: {'lr': 0.0004999613867976264, 'samples': 543168, 'steps': 2828, 'loss/train': 2.7821502685546875}} +11/06/2021 21:39:54 - INFO - __main__ - Step 2833: {'lr': 0.0004999610128317818, 'samples': 543936, 'steps': 2832, 'loss/train': 1.7340575456619263}} +11/06/2021 21:39:56 - INFO - __main__ - Step 2837: {'lr': 0.0004999606370638801, 'samples': 544704, 'steps': 2836, 'loss/train': 1.946204423904419}}} +11/06/2021 21:39:58 - INFO - __main__ - Step 2842: {'lr': 0.0004999601648198641, 'samples': 545664, 'steps': 2841, 'loss/train': 2.791858434677124}}} +11/06/2021 21:39:58 - INFO - __main__ - Step 2842: {'lr': 0.0004999601648198641, 'samples': 545664, 'steps': 2841, 'loss/train': 2.791858434677124}}} +11/06/2021 21:40:02 - INFO - __main__ - Step 2850: {'lr': 0.0004999594033727747, 'samples': 547200, 'steps': 2849, 'loss/train': 2.0793142318725586}} +11/06/2021 21:40:04 - INFO - __main__ - Step 2854: {'lr': 0.0004999590199461602, 'samples': 547968, 'steps': 2853, 'loss/train': 2.220766067504883}}} +11/06/2021 21:40:06 - INFO - __main__ - Step 2858: {'lr': 0.000499958634717503, 'samples': 548736, 'steps': 2857, 'loss/train': 1.4249017238616943}}} +11/06/2021 21:40:08 - INFO - __main__ - Step 2862: {'lr': 0.0004999582476868055, 'samples': 549504, 'steps': 2861, 'loss/train': 2.6905484199523926}} +11/06/2021 21:40:10 - INFO - __main__ - Step 2867: {'lr': 0.0004999577613643192, 'samples': 550464, 'steps': 2866, 'loss/train': 2.0363290309906006}} +11/06/2021 21:40:10 - INFO - __main__ - Step 2867: {'lr': 0.0004999577613643192, 'samples': 550464, 'steps': 2866, 'loss/train': 2.0363290309906006}} +11/06/2021 21:40:14 - INFO - __main__ - Step 2874: {'lr': 0.000499957075782501, 'samples': 551808, 'steps': 2873, 'loss/train': 1.8168832063674927}}} +11/06/2021 21:40:16 - INFO - __main__ - Step 2878: {'lr': 0.0004999566815436715, 'samples': 552576, 'steps': 2877, 'loss/train': 2.445081949234009}}} +11/06/2021 21:40:18 - INFO - __main__ - Step 2883: {'lr': 0.0004999561862110358, 'samples': 553536, 'steps': 2882, 'loss/train': 1.861746072769165}}} +11/06/2021 21:40:18 - INFO - __main__ - Step 2883: {'lr': 0.0004999561862110358, 'samples': 553536, 'steps': 2882, 'loss/train': 1.861746072769165}}} +11/06/2021 21:40:22 - INFO - __main__ - Step 2891: {'lr': 0.0004999553878222482, 'samples': 555072, 'steps': 2890, 'loss/train': 1.2182731628417969}} +11/06/2021 21:40:24 - INFO - __main__ - Step 2895: {'lr': 0.000499954985924828, 'samples': 555840, 'steps': 2894, 'loss/train': 1.992488980293274}9}} +11/06/2021 21:40:26 - INFO - __main__ - Step 2899: {'lr': 0.0004999545822253941, 'samples': 556608, 'steps': 2898, 'loss/train': 1.9909908771514893}} +11/06/2021 21:40:28 - INFO - __main__ - Step 2903: {'lr': 0.0004999541767239493, 'samples': 557376, 'steps': 2902, 'loss/train': 2.2086076736450195}} +11/06/2021 21:40:30 - INFO - __main__ - Step 2909: {'lr': 0.0004999535650930182, 'samples': 558528, 'steps': 2908, 'loss/train': 1.6833531856536865}} +11/06/2021 21:40:30 - INFO - __main__ - Step 2909: {'lr': 0.0004999535650930182, 'samples': 558528, 'steps': 2908, 'loss/train': 1.6833531856536865}} +11/06/2021 21:40:34 - INFO - __main__ - Step 2914: {'lr': 0.0004999530523033817, 'samples': 559488, 'steps': 2913, 'loss/train': 1.3060599565505981}} +11/06/2021 21:40:36 - INFO - __main__ - Step 2920: {'lr': 0.0004999524332391937, 'samples': 560640, 'steps': 2919, 'loss/train': 1.4589003324508667}} +11/06/2021 21:40:38 - INFO - __main__ - Step 2924: {'lr': 0.0004999520182772402, 'samples': 561408, 'steps': 2923, 'loss/train': 2.112090826034546}}} +11/06/2021 21:40:41 - INFO - __main__ - Step 2928: {'lr': 0.0004999516015132945, 'samples': 562176, 'steps': 2927, 'loss/train': 1.2997283935546875}} +11/06/2021 21:40:43 - INFO - __main__ - Step 2932: {'lr': 0.0004999511829473593, 'samples': 562944, 'steps': 2931, 'loss/train': 1.8353915214538574}} +11/06/2021 21:40:44 - INFO - __main__ - Step 2936: {'lr': 0.0004999507625794378, 'samples': 563712, 'steps': 2935, 'loss/train': 2.2181787490844727}} +11/06/2021 21:40:46 - INFO - __main__ - Step 2940: {'lr': 0.000499950340409533, 'samples': 564480, 'steps': 2939, 'loss/train': 2.1608986854553223}}} +11/06/2021 21:40:49 - INFO - __main__ - Step 2945: {'lr': 0.0004999498101631177, 'samples': 565440, 'steps': 2944, 'loss/train': 2.750171422958374}}} +11/06/2021 21:40:51 - INFO - __main__ - Step 2949: {'lr': 0.0004999493839387615, 'samples': 566208, 'steps': 2948, 'loss/train': 0.8493632674217224}} +11/06/2021 21:40:51 - INFO - __main__ - Step 2949: {'lr': 0.0004999493839387615, 'samples': 566208, 'steps': 2948, 'loss/train': 0.8493632674217224}} +11/06/2021 21:40:54 - INFO - __main__ - Step 2956: {'lr': 0.0004999486337101419, 'samples': 567552, 'steps': 2955, 'loss/train': 2.1768510341644287}} +11/06/2021 21:40:56 - INFO - __main__ - Step 2961: {'lr': 0.0004999480944538655, 'samples': 568512, 'steps': 2960, 'loss/train': 2.1335995197296143}} +11/06/2021 21:40:59 - INFO - __main__ - Step 2966: {'lr': 0.0004999475523820203, 'samples': 569472, 'steps': 2965, 'loss/train': 1.6673521995544434}} +11/06/2021 21:41:01 - INFO - __main__ - Step 2970: {'lr': 0.0004999471166973385, 'samples': 570240, 'steps': 2969, 'loss/train': 2.754880905151367}}} +11/06/2021 21:41:01 - INFO - __main__ - Step 2970: {'lr': 0.0004999471166973385, 'samples': 570240, 'steps': 2969, 'loss/train': 2.754880905151367}}} +11/06/2021 21:41:04 - INFO - __main__ - Step 2977: {'lr': 0.0004999463499131884, 'samples': 571584, 'steps': 2976, 'loss/train': 2.5181667804718018}} +11/06/2021 21:41:06 - INFO - __main__ - Step 2982: {'lr': 0.000499945798831564, 'samples': 572544, 'steps': 2981, 'loss/train': 2.780032157897949}8}} +11/06/2021 21:41:09 - INFO - __main__ - Step 2987: {'lr': 0.0004999452449343967, 'samples': 573504, 'steps': 2986, 'loss/train': 2.3532779216766357}} +11/06/2021 21:41:11 - INFO - __main__ - Step 2991: {'lr': 0.000499944799789476, 'samples': 574272, 'steps': 2990, 'loss/train': 2.203000545501709}7}} +11/06/2021 21:41:13 - INFO - __main__ - Step 2995: {'lr': 0.0004999443528426149, 'samples': 575040, 'steps': 2994, 'loss/train': 2.4999752044677734}} +11/06/2021 21:41:14 - INFO - __main__ - Step 2999: {'lr': 0.0004999439040938168, 'samples': 575808, 'steps': 2998, 'loss/train': 2.217271327972412}}} +11/06/2021 21:41:16 - INFO - __main__ - Step 3003: {'lr': 0.0004999434535430848, 'samples': 576576, 'steps': 3002, 'loss/train': 2.3395111560821533}} +11/06/2021 21:41:19 - INFO - __main__ - Step 3008: {'lr': 0.0004999428878207054, 'samples': 577536, 'steps': 3007, 'loss/train': 2.3040289878845215}} +11/06/2021 21:41:21 - INFO - __main__ - Step 3012: {'lr': 0.0004999424332156341, 'samples': 578304, 'steps': 3011, 'loss/train': 1.8335940837860107}} +11/06/2021 21:41:21 - INFO - __main__ - Step 3012: {'lr': 0.0004999424332156341, 'samples': 578304, 'steps': 3011, 'loss/train': 1.8335940837860107}} +11/06/2021 21:41:24 - INFO - __main__ - Step 3019: {'lr': 0.0004999416333208835, 'samples': 579648, 'steps': 3018, 'loss/train': 1.6759024858474731}} +11/06/2021 21:41:26 - INFO - __main__ - Step 3023: {'lr': 0.0004999411737605313, 'samples': 580416, 'steps': 3022, 'loss/train': 1.946350336074829}}} +11/06/2021 21:41:26 - INFO - __main__ - Step 3023: {'lr': 0.0004999411737605313, 'samples': 580416, 'steps': 3022, 'loss/train': 1.946350336074829}}} +11/06/2021 21:41:31 - INFO - __main__ - Step 3031: {'lr': 0.0004999402492340875, 'samples': 581952, 'steps': 3030, 'loss/train': 2.4372713565826416}} +11/06/2021 21:41:33 - INFO - __main__ - Step 3035: {'lr': 0.0004999397842680027, 'samples': 582720, 'steps': 3034, 'loss/train': 2.364650249481201}}} +11/06/2021 21:41:34 - INFO - __main__ - Step 3039: {'lr': 0.0004999393175000137, 'samples': 583488, 'steps': 3038, 'loss/train': 2.1946680545806885}} +11/06/2021 21:41:37 - INFO - __main__ - Step 3043: {'lr': 0.000499938848930124, 'samples': 584256, 'steps': 3042, 'loss/train': 1.9267772436141968}}} +11/06/2021 21:41:37 - INFO - __main__ - Step 3043: {'lr': 0.000499938848930124, 'samples': 584256, 'steps': 3042, 'loss/train': 1.9267772436141968}}} +11/06/2021 21:41:40 - INFO - __main__ - Step 3051: {'lr': 0.0004999379063846555, 'samples': 585792, 'steps': 3050, 'loss/train': 2.1658904552459717}} +11/06/2021 21:41:42 - INFO - __main__ - Step 3055: {'lr': 0.0004999374324090837, 'samples': 586560, 'steps': 3054, 'loss/train': 2.6458959579467773}} +11/06/2021 21:41:45 - INFO - __main__ - Step 3060: {'lr': 0.0004999368374057155, 'samples': 587520, 'steps': 3059, 'loss/train': 2.637629985809326}}} +11/06/2021 21:41:47 - INFO - __main__ - Step 3064: {'lr': 0.0004999363593759022, 'samples': 588288, 'steps': 3063, 'loss/train': 2.5826447010040283}} +11/06/2021 21:41:47 - INFO - __main__ - Step 3064: {'lr': 0.0004999363593759022, 'samples': 588288, 'steps': 3063, 'loss/train': 2.5826447010040283}} +11/06/2021 21:41:50 - INFO - __main__ - Step 3071: {'lr': 0.0004999355184879587, 'samples': 589632, 'steps': 3070, 'loss/train': 1.911078691482544}}} +11/06/2021 21:41:53 - INFO - __main__ - Step 3076: {'lr': 0.0004999349144751997, 'samples': 590592, 'steps': 3075, 'loss/train': 2.093614339828491}}} +11/06/2021 21:41:53 - INFO - __main__ - Step 3076: {'lr': 0.0004999349144751997, 'samples': 590592, 'steps': 3075, 'loss/train': 2.093614339828491}}} +11/06/2021 21:41:56 - INFO - __main__ - Step 3082: {'lr': 0.0004999341859435345, 'samples': 591744, 'steps': 3081, 'loss/train': 2.610215902328491}}} +11/06/2021 21:41:56 - INFO - __main__ - Step 3082: {'lr': 0.0004999341859435345, 'samples': 591744, 'steps': 3081, 'loss/train': 2.610215902328491}}} +11/06/2021 21:42:01 - INFO - __main__ - Step 3091: {'lr': 0.0004999330855444274, 'samples': 593472, 'steps': 3090, 'loss/train': 2.4830446243286133}} +11/06/2021 21:42:02 - INFO - __main__ - Step 3095: {'lr': 0.0004999325935501395, 'samples': 594240, 'steps': 3094, 'loss/train': 2.2615649700164795}} +11/06/2021 21:42:04 - INFO - __main__ - Step 3099: {'lr': 0.0004999320997539992, 'samples': 595008, 'steps': 3098, 'loss/train': 2.1478734016418457}} +11/06/2021 21:42:07 - INFO - __main__ - Step 3104: {'lr': 0.0004999314799749745, 'samples': 595968, 'steps': 3103, 'loss/train': 3.2617650032043457}} +11/06/2021 21:42:07 - INFO - __main__ - Step 3104: {'lr': 0.0004999314799749745, 'samples': 595968, 'steps': 3103, 'loss/train': 3.2617650032043457}} +11/06/2021 21:42:10 - INFO - __main__ - Step 3111: {'lr': 0.0004999306075545002, 'samples': 597312, 'steps': 3110, 'loss/train': 2.7295010089874268}} +11/06/2021 21:42:12 - INFO - __main__ - Step 3115: {'lr': 0.0004999301065509863, 'samples': 598080, 'steps': 3114, 'loss/train': 2.4557383060455322}} +11/06/2021 21:42:15 - INFO - __main__ - Step 3120: {'lr': 0.0004999294777627649, 'samples': 599040, 'steps': 3119, 'loss/train': 1.3478337526321411}} +11/06/2021 21:42:17 - INFO - __main__ - Step 3125: {'lr': 0.0004999288461591842, 'samples': 600000, 'steps': 3124, 'loss/train': 1.7113127708435059}} +11/06/2021 21:42:17 - INFO - __main__ - Step 3125: {'lr': 0.0004999288461591842, 'samples': 600000, 'steps': 3124, 'loss/train': 1.7113127708435059}} +11/06/2021 21:42:17 - INFO - __main__ - Step 3125: {'lr': 0.0004999288461591842, 'samples': 600000, 'steps': 3124, 'loss/train': 1.7113127708435059}} +11/06/2021 21:42:22 - INFO - __main__ - Step 3135: {'lr': 0.0004999275745059741, 'samples': 601920, 'steps': 3134, 'loss/train': 2.9237546920776367}} +11/06/2021 21:42:25 - INFO - __main__ - Step 3141: {'lr': 0.0004999268061085959, 'samples': 603072, 'steps': 3140, 'loss/train': 2.418550968170166}}} +11/06/2021 21:42:25 - INFO - __main__ - Step 3141: {'lr': 0.0004999268061085959, 'samples': 603072, 'steps': 3140, 'loss/train': 2.418550968170166}}} +11/06/2021 21:42:29 - INFO - __main__ - Step 3148: {'lr': 0.0004999259045210901, 'samples': 604416, 'steps': 3147, 'loss/train': 1.4385805130004883}} +11/06/2021 21:42:30 - INFO - __main__ - Step 3152: {'lr': 0.0004999253868507476, 'samples': 605184, 'steps': 3151, 'loss/train': 2.5812270641326904}} +11/06/2021 21:42:33 - INFO - __main__ - Step 3156: {'lr': 0.0004999248673786049, 'samples': 605952, 'steps': 3155, 'loss/train': 1.7660547494888306}} +11/06/2021 21:42:35 - INFO - __main__ - Step 3162: {'lr': 0.0004999240847920233, 'samples': 607104, 'steps': 3161, 'loss/train': 1.7738767862319946}} +11/06/2021 21:42:37 - INFO - __main__ - Step 3166: {'lr': 0.0004999235608153961, 'samples': 607872, 'steps': 3165, 'loss/train': 1.9972015619277954}} +11/06/2021 21:42:39 - INFO - __main__ - Step 3170: {'lr': 0.0004999230350369816, 'samples': 608640, 'steps': 3169, 'loss/train': 2.8902382850646973}} +11/06/2021 21:42:39 - INFO - __main__ - Step 3170: {'lr': 0.0004999230350369816, 'samples': 608640, 'steps': 3169, 'loss/train': 2.8902382850646973}} +11/06/2021 21:42:42 - INFO - __main__ - Step 3177: {'lr': 0.0004999221105892172, 'samples': 609984, 'steps': 3176, 'loss/train': 2.14980411529541}3}} +11/06/2021 21:42:45 - INFO - __main__ - Step 3182: {'lr': 0.000499921446891053, 'samples': 610944, 'steps': 3181, 'loss/train': 2.965468168258667}3}} +11/06/2021 21:42:47 - INFO - __main__ - Step 3187: {'lr': 0.0004999207803776201, 'samples': 611904, 'steps': 3186, 'loss/train': 2.031585693359375}}} +11/06/2021 21:42:49 - INFO - __main__ - Step 3191: {'lr': 0.0004999202451398853, 'samples': 612672, 'steps': 3190, 'loss/train': 2.0862905979156494}} +11/06/2021 21:42:49 - INFO - __main__ - Step 3191: {'lr': 0.0004999202451398853, 'samples': 612672, 'steps': 3190, 'loss/train': 2.0862905979156494}} +11/06/2021 21:42:53 - INFO - __main__ - Step 3198: {'lr': 0.0004999193041383588, 'samples': 614016, 'steps': 3197, 'loss/train': 2.2492079734802246}} +11/06/2021 21:42:55 - INFO - __main__ - Step 3203: {'lr': 0.0004999186286161169, 'samples': 614976, 'steps': 3202, 'loss/train': 2.909585952758789}}} +11/06/2021 21:42:55 - INFO - __main__ - Step 3203: {'lr': 0.0004999186286161169, 'samples': 614976, 'steps': 3202, 'loss/train': 2.909585952758789}}} +11/06/2021 21:42:55 - INFO - __main__ - Step 3203: {'lr': 0.0004999186286161169, 'samples': 614976, 'steps': 3202, 'loss/train': 2.909585952758789}}} +11/06/2021 21:43:00 - INFO - __main__ - Step 3213: {'lr': 0.0004999172691259293, 'samples': 616896, 'steps': 3212, 'loss/train': 1.8541127443313599}} +11/06/2021 21:43:00 - INFO - __main__ - Step 3213: {'lr': 0.0004999172691259293, 'samples': 616896, 'steps': 3212, 'loss/train': 1.8541127443313599}} +11/06/2021 21:43:05 - INFO - __main__ - Step 3222: {'lr': 0.0004999160359567011, 'samples': 618624, 'steps': 3221, 'loss/train': 1.9945106506347656}} +11/06/2021 21:43:07 - INFO - __main__ - Step 3226: {'lr': 0.0004999154849536698, 'samples': 619392, 'steps': 3225, 'loss/train': 2.3978424072265625}} +11/06/2021 21:43:08 - INFO - __main__ - Step 3230: {'lr': 0.0004999149321489095, 'samples': 620160, 'steps': 3229, 'loss/train': 3.806713581085205}}} +11/06/2021 21:43:10 - INFO - __main__ - Step 3234: {'lr': 0.0004999143775424241, 'samples': 620928, 'steps': 3233, 'loss/train': 2.1690218448638916}} +11/06/2021 21:43:13 - INFO - __main__ - Step 3239: {'lr': 0.0004999136817506478, 'samples': 621888, 'steps': 3238, 'loss/train': 2.375570297241211}}} +11/06/2021 21:43:15 - INFO - __main__ - Step 3243: {'lr': 0.000499913123090296, 'samples': 622656, 'steps': 3242, 'loss/train': 2.318620204925537}}}} +11/06/2021 21:43:17 - INFO - __main__ - Step 3247: {'lr': 0.0004999125626282322, 'samples': 623424, 'steps': 3246, 'loss/train': 2.054605484008789}}} +11/06/2021 21:43:17 - INFO - __main__ - Step 3247: {'lr': 0.0004999125626282322, 'samples': 623424, 'steps': 3246, 'loss/train': 2.054605484008789}}} +11/06/2021 21:43:20 - INFO - __main__ - Step 3255: {'lr': 0.0004999114362989849, 'samples': 624960, 'steps': 3254, 'loss/train': 2.2318007946014404}} +11/06/2021 21:43:23 - INFO - __main__ - Step 3260: {'lr': 0.0004999107286835006, 'samples': 625920, 'steps': 3259, 'loss/train': 0.5624179244041443}} +11/06/2021 21:43:25 - INFO - __main__ - Step 3264: {'lr': 0.0004999101605642061, 'samples': 626688, 'steps': 3263, 'loss/train': 2.3034634590148926}} +11/06/2021 21:43:25 - INFO - __main__ - Step 3264: {'lr': 0.0004999101605642061, 'samples': 626688, 'steps': 3263, 'loss/train': 2.3034634590148926}} +11/06/2021 21:43:28 - INFO - __main__ - Step 3271: {'lr': 0.0004999091620201255, 'samples': 628032, 'steps': 3270, 'loss/train': 4.105412006378174}}} +11/06/2021 21:43:31 - INFO - __main__ - Step 3277: {'lr': 0.0004999083017335951, 'samples': 629184, 'steps': 3276, 'loss/train': 2.3697509765625}4}}} +11/06/2021 21:43:33 - INFO - __main__ - Step 3281: {'lr': 0.0004999077259571442, 'samples': 629952, 'steps': 3280, 'loss/train': 2.139662504196167}}} +11/06/2021 21:43:33 - INFO - __main__ - Step 3281: {'lr': 0.0004999077259571442, 'samples': 629952, 'steps': 3280, 'loss/train': 2.139662504196167}}} +11/06/2021 21:43:36 - INFO - __main__ - Step 3288: {'lr': 0.0004999067140130819, 'samples': 631296, 'steps': 3287, 'loss/train': 2.0896875858306885}} +11/06/2021 21:43:39 - INFO - __main__ - Step 3292: {'lr': 0.0004999061332820401, 'samples': 632064, 'steps': 3291, 'loss/train': 1.7333624362945557}} +11/06/2021 21:43:41 - INFO - __main__ - Step 3297: {'lr': 0.0004999054048346517, 'samples': 633024, 'steps': 3296, 'loss/train': 2.7712512016296387}} +11/06/2021 21:43:43 - INFO - __main__ - Step 3302: {'lr': 0.0004999046735721755, 'samples': 633984, 'steps': 3301, 'loss/train': 2.4104175567626953}} +11/06/2021 21:43:43 - INFO - __main__ - Step 3302: {'lr': 0.0004999046735721755, 'samples': 633984, 'steps': 3301, 'loss/train': 2.4104175567626953}} +11/06/2021 21:43:47 - INFO - __main__ - Step 3309: {'lr': 0.0004999036450753767, 'samples': 635328, 'steps': 3308, 'loss/train': 2.1639621257781982}} +11/06/2021 21:43:48 - INFO - __main__ - Step 3313: {'lr': 0.0004999030548856586, 'samples': 636096, 'steps': 3312, 'loss/train': 1.3736777305603027}} +11/06/2021 21:43:51 - INFO - __main__ - Step 3318: {'lr': 0.0004999023146149565, 'samples': 637056, 'steps': 3317, 'loss/train': 1.93985116481781}7}} +11/06/2021 21:43:53 - INFO - __main__ - Step 3323: {'lr': 0.000499901571529201, 'samples': 638016, 'steps': 3322, 'loss/train': 1.9539903402328491}}} +11/06/2021 21:43:55 - INFO - __main__ - Step 3327: {'lr': 0.000499900975033764, 'samples': 638784, 'steps': 3326, 'loss/train': 2.444103240966797}}}} +11/06/2021 21:43:55 - INFO - __main__ - Step 3327: {'lr': 0.000499900975033764, 'samples': 638784, 'steps': 3326, 'loss/train': 2.444103240966797}}}} +11/06/2021 21:43:59 - INFO - __main__ - Step 3334: {'lr': 0.0004998999268315932, 'samples': 640128, 'steps': 3333, 'loss/train': 2.300365447998047}}} +11/06/2021 21:44:01 - INFO - __main__ - Step 3339: {'lr': 0.000499899174737724, 'samples': 641088, 'steps': 3338, 'loss/train': 2.363450765609741}}}} +11/06/2021 21:44:03 - INFO - __main__ - Step 3343: {'lr': 0.0004998985710358155, 'samples': 641856, 'steps': 3342, 'loss/train': 1.9851315021514893}} +11/06/2021 21:44:05 - INFO - __main__ - Step 3347: {'lr': 0.0004998979655323, 'samples': 642624, 'steps': 3346, 'loss/train': 1.8560844659805298}93}} +11/06/2021 21:44:05 - INFO - __main__ - Step 3347: {'lr': 0.0004998979655323, 'samples': 642624, 'steps': 3346, 'loss/train': 1.8560844659805298}93}} +11/06/2021 21:44:09 - INFO - __main__ - Step 3354: {'lr': 0.0004998969015660438, 'samples': 643968, 'steps': 3353, 'loss/train': 1.8647414445877075}} +11/06/2021 21:44:09 - INFO - __main__ - Step 3354: {'lr': 0.0004998969015660438, 'samples': 643968, 'steps': 3353, 'loss/train': 1.8647414445877075}} +11/06/2021 21:44:13 - INFO - __main__ - Step 3363: {'lr': 0.0004998955255022547, 'samples': 645696, 'steps': 3362, 'loss/train': 2.9360525608062744}} +11/06/2021 21:44:15 - INFO - __main__ - Step 3367: {'lr': 0.0004998949109907697, 'samples': 646464, 'steps': 3366, 'loss/train': 2.29533052444458}4}} +11/06/2021 21:44:17 - INFO - __main__ - Step 3371: {'lr': 0.000499894294677704, 'samples': 647232, 'steps': 3370, 'loss/train': 2.024826765060425}4}} +11/06/2021 21:44:19 - INFO - __main__ - Step 3375: {'lr': 0.000499893676563062, 'samples': 648000, 'steps': 3374, 'loss/train': 2.1932318210601807}}} +11/06/2021 21:44:21 - INFO - __main__ - Step 3380: {'lr': 0.0004998929013863, 'samples': 648960, 'steps': 3379, 'loss/train': 1.080916404724121}07}}} +11/06/2021 21:44:21 - INFO - __main__ - Step 3380: {'lr': 0.0004998929013863, 'samples': 648960, 'steps': 3379, 'loss/train': 1.080916404724121}07}}} +11/06/2021 21:44:25 - INFO - __main__ - Step 3387: {'lr': 0.0004998918114097237, 'samples': 650304, 'steps': 3386, 'loss/train': 2.346414566040039}}} +11/06/2021 21:44:27 - INFO - __main__ - Step 3391: {'lr': 0.0004998911860888217, 'samples': 651072, 'steps': 3390, 'loss/train': 1.96201491355896}}}} +11/06/2021 21:44:29 - INFO - __main__ - Step 3396: {'lr': 0.0004998904019042596, 'samples': 652032, 'steps': 3395, 'loss/train': 2.2461233139038086}} +11/06/2021 21:44:32 - INFO - __main__ - Step 3401: {'lr': 0.0004998896149047786, 'samples': 652992, 'steps': 3400, 'loss/train': 2.4505343437194824}} +11/06/2021 21:44:32 - INFO - __main__ - Step 3401: {'lr': 0.0004998896149047786, 'samples': 652992, 'steps': 3400, 'loss/train': 2.4505343437194824}} +11/06/2021 21:44:35 - INFO - __main__ - Step 3408: {'lr': 0.0004998885083764582, 'samples': 654336, 'steps': 3407, 'loss/train': 2.54028582572937}4}} +11/06/2021 21:44:37 - INFO - __main__ - Step 3412: {'lr': 0.0004998878735974493, 'samples': 655104, 'steps': 3411, 'loss/train': 2.2348644733428955}} +11/06/2021 21:44:39 - INFO - __main__ - Step 3417: {'lr': 0.0004998870775902872, 'samples': 656064, 'steps': 3416, 'loss/train': 2.356597900390625}}} +11/06/2021 21:44:39 - INFO - __main__ - Step 3417: {'lr': 0.0004998870775902872, 'samples': 656064, 'steps': 3416, 'loss/train': 2.356597900390625}}} +11/06/2021 21:44:39 - INFO - __main__ - Step 3417: {'lr': 0.0004998870775902872, 'samples': 656064, 'steps': 3416, 'loss/train': 2.356597900390625}}} +11/06/2021 21:44:45 - INFO - __main__ - Step 3428: {'lr': 0.0004998853164661606, 'samples': 658176, 'steps': 3427, 'loss/train': 1.7819459438323975}} +11/06/2021 21:44:47 - INFO - __main__ - Step 3433: {'lr': 0.0004998845114514095, 'samples': 659136, 'steps': 3432, 'loss/train': 1.8727471828460693}} +11/06/2021 21:44:47 - INFO - __main__ - Step 3433: {'lr': 0.0004998845114514095, 'samples': 659136, 'steps': 3432, 'loss/train': 1.8727471828460693}} +11/06/2021 21:44:52 - INFO - __main__ - Step 3440: {'lr': 0.0004998833797018074, 'samples': 660480, 'steps': 3439, 'loss/train': 1.823896050453186}}} +11/06/2021 21:44:53 - INFO - __main__ - Step 3444: {'lr': 0.0004998827305106884, 'samples': 661248, 'steps': 3443, 'loss/train': 1.7395120859146118}} +11/06/2021 21:44:55 - INFO - __main__ - Step 3448: {'lr': 0.0004998820795180766, 'samples': 662016, 'steps': 3447, 'loss/train': 2.5539913177490234}} +11/06/2021 21:44:58 - INFO - __main__ - Step 3453: {'lr': 0.0004998812632439697, 'samples': 662976, 'steps': 3452, 'loss/train': 1.7184646129608154}} +11/06/2021 21:45:00 - INFO - __main__ - Step 3457: {'lr': 0.0004998806081980162, 'samples': 663744, 'steps': 3456, 'loss/train': 2.589240074157715}}} +11/06/2021 21:45:02 - INFO - __main__ - Step 3461: {'lr': 0.0004998799513505851, 'samples': 664512, 'steps': 3460, 'loss/train': 2.196791648864746}}} +11/06/2021 21:45:03 - INFO - __main__ - Step 3465: {'lr': 0.0004998792927016812, 'samples': 665280, 'steps': 3464, 'loss/train': 2.557910203933716}}} +11/06/2021 21:45:05 - INFO - __main__ - Step 3469: {'lr': 0.0004998786322513093, 'samples': 666048, 'steps': 3468, 'loss/train': 2.309483528137207}}} +11/06/2021 21:45:08 - INFO - __main__ - Step 3475: {'lr': 0.0004998776381980092, 'samples': 667200, 'steps': 3474, 'loss/train': 2.124244213104248}}} +11/06/2021 21:45:10 - INFO - __main__ - Step 3479: {'lr': 0.000499876973243988, 'samples': 667968, 'steps': 3478, 'loss/train': 1.411661148071289}}}} +11/06/2021 21:45:10 - INFO - __main__ - Step 3479: {'lr': 0.000499876973243988, 'samples': 667968, 'steps': 3478, 'loss/train': 1.411661148071289}}}} +11/06/2021 21:45:13 - INFO - __main__ - Step 3486: {'lr': 0.0004998758052397115, 'samples': 669312, 'steps': 3485, 'loss/train': 1.9367340803146362}} +11/06/2021 21:45:15 - INFO - __main__ - Step 3491: {'lr': 0.0004998749675732357, 'samples': 670272, 'steps': 3490, 'loss/train': 2.008915662765503}}} +11/06/2021 21:45:18 - INFO - __main__ - Step 3495: {'lr': 0.000499874295413438, 'samples': 671040, 'steps': 3494, 'loss/train': 1.9268534183502197}}} +11/06/2021 21:45:20 - INFO - __main__ - Step 3499: {'lr': 0.0004998736214522084, 'samples': 671808, 'steps': 3498, 'loss/train': 3.6572864055633545}} +11/06/2021 21:45:21 - INFO - __main__ - Step 3503: {'lr': 0.0004998729456895516, 'samples': 672576, 'steps': 3502, 'loss/train': 2.645084857940674}}} +11/06/2021 21:45:24 - INFO - __main__ - Step 3507: {'lr': 0.0004998722681254725, 'samples': 673344, 'steps': 3506, 'loss/train': 1.835058569908142}}} +11/06/2021 21:45:26 - INFO - __main__ - Step 3512: {'lr': 0.000499871418637131, 'samples': 674304, 'steps': 3511, 'loss/train': 1.7968868017196655}}} +11/06/2021 21:45:28 - INFO - __main__ - Step 3516: {'lr': 0.0004998707370198695, 'samples': 675072, 'steps': 3515, 'loss/train': 2.0000085830688477}} +11/06/2021 21:45:28 - INFO - __main__ - Step 3516: {'lr': 0.0004998707370198695, 'samples': 675072, 'steps': 3515, 'loss/train': 2.0000085830688477}} +11/06/2021 21:45:31 - INFO - __main__ - Step 3523: {'lr': 0.0004998695398550309, 'samples': 676416, 'steps': 3522, 'loss/train': 2.8342642784118652}} +11/06/2021 21:45:34 - INFO - __main__ - Step 3528: {'lr': 0.0004998686813596668, 'samples': 677376, 'steps': 3527, 'loss/train': 2.326568126678467}}} +11/06/2021 21:45:36 - INFO - __main__ - Step 3532: {'lr': 0.0004998679925368094, 'samples': 678144, 'steps': 3531, 'loss/train': 1.9451133012771606}} +11/06/2021 21:45:38 - INFO - __main__ - Step 3537: {'lr': 0.0004998671289750386, 'samples': 679104, 'steps': 3536, 'loss/train': 2.357372283935547}}} +11/06/2021 21:45:38 - INFO - __main__ - Step 3537: {'lr': 0.0004998671289750386, 'samples': 679104, 'steps': 3536, 'loss/train': 2.357372283935547}}} +11/06/2021 21:45:41 - INFO - __main__ - Step 3544: {'lr': 0.0004998659152599381, 'samples': 680448, 'steps': 3543, 'loss/train': 2.9186902046203613}} +11/06/2021 21:45:44 - INFO - __main__ - Step 3548: {'lr': 0.0004998652192315644, 'samples': 681216, 'steps': 3547, 'loss/train': 1.8039276599884033}} +11/06/2021 21:45:46 - INFO - __main__ - Step 3552: {'lr': 0.000499864521401824, 'samples': 681984, 'steps': 3551, 'loss/train': 2.100595474243164}3}} +11/06/2021 21:45:48 - INFO - __main__ - Step 3556: {'lr': 0.0004998638217707222, 'samples': 682752, 'steps': 3555, 'loss/train': 2.264774799346924}}} +11/06/2021 21:45:50 - INFO - __main__ - Step 3560: {'lr': 0.0004998631203382639, 'samples': 683520, 'steps': 3559, 'loss/train': 2.074711561203003}}} +11/06/2021 21:45:51 - INFO - __main__ - Step 3564: {'lr': 0.0004998624171044541, 'samples': 684288, 'steps': 3563, 'loss/train': 1.9695250988006592}} +11/06/2021 21:45:53 - INFO - __main__ - Step 3568: {'lr': 0.0004998617120692977, 'samples': 685056, 'steps': 3567, 'loss/train': 1.8647109270095825}} +11/06/2021 21:45:56 - INFO - __main__ - Step 3573: {'lr': 0.0004998608282422169, 'samples': 686016, 'steps': 3572, 'loss/train': 2.195950746536255}}} +11/06/2021 21:45:56 - INFO - __main__ - Step 3573: {'lr': 0.0004998608282422169, 'samples': 686016, 'steps': 3572, 'loss/train': 2.195950746536255}}} +11/06/2021 21:45:59 - INFO - __main__ - Step 3580: {'lr': 0.0004998595861558016, 'samples': 687360, 'steps': 3579, 'loss/train': 2.119218111038208}}} +11/06/2021 21:46:01 - INFO - __main__ - Step 3584: {'lr': 0.0004998588739153108, 'samples': 688128, 'steps': 3583, 'loss/train': 1.7447315454483032}} +11/06/2021 21:46:04 - INFO - __main__ - Step 3589: {'lr': 0.0004998579810815905, 'samples': 689088, 'steps': 3588, 'loss/train': 2.701934576034546}}} +11/06/2021 21:46:04 - INFO - __main__ - Step 3589: {'lr': 0.0004998579810815905, 'samples': 689088, 'steps': 3588, 'loss/train': 2.701934576034546}}} +11/06/2021 21:46:08 - INFO - __main__ - Step 3597: {'lr': 0.0004998565466933702, 'samples': 690624, 'steps': 3596, 'loss/train': 2.6100289821624756}} +11/06/2021 21:46:10 - INFO - __main__ - Step 3601: {'lr': 0.0004998558267973013, 'samples': 691392, 'steps': 3600, 'loss/train': 2.1335763931274414}} +11/06/2021 21:46:11 - INFO - __main__ - Step 3605: {'lr': 0.0004998551050999336, 'samples': 692160, 'steps': 3604, 'loss/train': 1.8231139183044434}} +11/06/2021 21:46:13 - INFO - __main__ - Step 3609: {'lr': 0.0004998543816012723, 'samples': 692928, 'steps': 3608, 'loss/train': 2.1296401023864746}} +11/06/2021 21:46:16 - INFO - __main__ - Step 3614: {'lr': 0.0004998534746948843, 'samples': 693888, 'steps': 3613, 'loss/train': 1.9264954328536987}} +11/06/2021 21:46:16 - INFO - __main__ - Step 3614: {'lr': 0.0004998534746948843, 'samples': 693888, 'steps': 3613, 'loss/train': 1.9264954328536987}} +11/06/2021 21:46:19 - INFO - __main__ - Step 3621: {'lr': 0.0004998522002975783, 'samples': 695232, 'steps': 3620, 'loss/train': 2.4836816787719727}} +11/06/2021 21:46:21 - INFO - __main__ - Step 3625: {'lr': 0.0004998514695937945, 'samples': 696000, 'steps': 3624, 'loss/train': 2.3775951862335205}} +11/06/2021 21:46:21 - INFO - __main__ - Step 3625: {'lr': 0.0004998514695937945, 'samples': 696000, 'steps': 3624, 'loss/train': 2.3775951862335205}} +11/06/2021 21:46:25 - INFO - __main__ - Step 3633: {'lr': 0.0004998500027824298, 'samples': 697536, 'steps': 3632, 'loss/train': 1.352131724357605}}} +11/06/2021 21:46:27 - INFO - __main__ - Step 3637: {'lr': 0.0004998492666748594, 'samples': 698304, 'steps': 3636, 'loss/train': 2.1306369304656982}} +11/06/2021 21:46:30 - INFO - __main__ - Step 3642: {'lr': 0.0004998483440073871, 'samples': 699264, 'steps': 3641, 'loss/train': 2.3207335472106934}} +11/06/2021 21:46:32 - INFO - __main__ - Step 3646: {'lr': 0.0004998476038470082, 'samples': 700032, 'steps': 3645, 'loss/train': 2.1402628421783447}} +11/06/2021 21:46:34 - INFO - __main__ - Step 3650: {'lr': 0.0004998468618853896, 'samples': 700800, 'steps': 3649, 'loss/train': 2.1500542163848877}} +11/06/2021 21:46:34 - INFO - __main__ - Step 3650: {'lr': 0.0004998468618853896, 'samples': 700800, 'steps': 3649, 'loss/train': 2.1500542163848877}} +11/06/2021 21:46:37 - INFO - __main__ - Step 3657: {'lr': 0.0004998455591183406, 'samples': 702144, 'steps': 3656, 'loss/train': 2.267188310623169}}} +11/06/2021 21:46:40 - INFO - __main__ - Step 3662: {'lr': 0.00049984462519315, 'samples': 703104, 'steps': 3661, 'loss/train': 2.506985664367676}9}}} +11/06/2021 21:46:42 - INFO - __main__ - Step 3667: {'lr': 0.0004998436884535562, 'samples': 704064, 'steps': 3666, 'loss/train': 1.854463815689087}}} +11/06/2021 21:46:42 - INFO - __main__ - Step 3667: {'lr': 0.0004998436884535562, 'samples': 704064, 'steps': 3666, 'loss/train': 1.854463815689087}}} +11/06/2021 21:46:45 - INFO - __main__ - Step 3674: {'lr': 0.0004998423722899475, 'samples': 705408, 'steps': 3673, 'loss/train': 1.8246042728424072}} +11/06/2021 21:46:47 - INFO - __main__ - Step 3678: {'lr': 0.0004998416177198022, 'samples': 706176, 'steps': 3677, 'loss/train': 1.930174708366394}}} +11/06/2021 21:46:50 - INFO - __main__ - Step 3683: {'lr': 0.0004998406719741888, 'samples': 707136, 'steps': 3682, 'loss/train': 1.118072509765625}}} +11/06/2021 21:46:52 - INFO - __main__ - Step 3687: {'lr': 0.0004998399133513594, 'samples': 707904, 'steps': 3686, 'loss/train': 2.232158899307251}}} +11/06/2021 21:46:54 - INFO - __main__ - Step 3691: {'lr': 0.0004998391529273457, 'samples': 708672, 'steps': 3690, 'loss/train': 2.0140085220336914}} +11/06/2021 21:46:54 - INFO - __main__ - Step 3691: {'lr': 0.0004998391529273457, 'samples': 708672, 'steps': 3690, 'loss/train': 2.0140085220336914}} +11/06/2021 21:46:57 - INFO - __main__ - Step 3698: {'lr': 0.0004998378178512388, 'samples': 710016, 'steps': 3697, 'loss/train': 2.363736391067505}}} +11/06/2021 21:47:00 - INFO - __main__ - Step 3704: {'lr': 0.0004998366691099395, 'samples': 711168, 'steps': 3703, 'loss/train': 1.9696950912475586}} +11/06/2021 21:47:02 - INFO - __main__ - Step 3708: {'lr': 0.0004998359010309544, 'samples': 711936, 'steps': 3707, 'loss/train': 2.483283758163452}}} +11/06/2021 21:47:04 - INFO - __main__ - Step 3712: {'lr': 0.0004998351311508143, 'samples': 712704, 'steps': 3711, 'loss/train': 1.7308366298675537}} +11/06/2021 21:47:06 - INFO - __main__ - Step 3716: {'lr': 0.0004998343594695242, 'samples': 713472, 'steps': 3715, 'loss/train': 1.7858660221099854}} +11/06/2021 21:47:08 - INFO - __main__ - Step 3720: {'lr': 0.0004998335859870903, 'samples': 714240, 'steps': 3719, 'loss/train': 1.7998706102371216}} +11/06/2021 21:47:10 - INFO - __main__ - Step 3724: {'lr': 0.0004998328107035176, 'samples': 715008, 'steps': 3723, 'loss/train': 2.392589807510376}}} +11/06/2021 21:47:12 - INFO - __main__ - Step 3729: {'lr': 0.0004998318390662095, 'samples': 715968, 'steps': 3728, 'loss/train': 1.9741984605789185}} +11/06/2021 21:47:14 - INFO - __main__ - Step 3733: {'lr': 0.0004998310597300956, 'samples': 716736, 'steps': 3732, 'loss/train': 2.505441665649414}}} +11/06/2021 21:47:14 - INFO - __main__ - Step 3733: {'lr': 0.0004998310597300956, 'samples': 716736, 'steps': 3732, 'loss/train': 2.505441665649414}}} +11/06/2021 21:47:17 - INFO - __main__ - Step 3740: {'lr': 0.0004998296915579539, 'samples': 718080, 'steps': 3739, 'loss/train': 2.2116055488586426}} +11/06/2021 21:47:20 - INFO - __main__ - Step 3745: {'lr': 0.0004998287109150547, 'samples': 719040, 'steps': 3744, 'loss/train': 1.8798199892044067}} +11/06/2021 21:47:22 - INFO - __main__ - Step 3750: {'lr': 0.0004998277274579313, 'samples': 720000, 'steps': 3749, 'loss/train': 2.172743558883667}}} +11/06/2021 21:47:24 - INFO - __main__ - Step 3754: {'lr': 0.0004998269386659988, 'samples': 720768, 'steps': 3753, 'loss/train': 2.281588077545166}}} +11/06/2021 21:47:26 - INFO - __main__ - Step 3758: {'lr': 0.0004998261480729755, 'samples': 721536, 'steps': 3757, 'loss/train': 2.4779069423675537}} +11/06/2021 21:47:28 - INFO - __main__ - Step 3762: {'lr': 0.0004998253556788675, 'samples': 722304, 'steps': 3761, 'loss/train': 2.088002920150757}}} +11/06/2021 21:47:30 - INFO - __main__ - Step 3766: {'lr': 0.0004998245614836802, 'samples': 723072, 'steps': 3765, 'loss/train': 2.278775930404663}}} +11/06/2021 21:47:32 - INFO - __main__ - Step 3771: {'lr': 0.0004998235662069372, 'samples': 724032, 'steps': 3770, 'loss/train': 1.7649283409118652}} +11/06/2021 21:47:32 - INFO - __main__ - Step 3771: {'lr': 0.0004998235662069372, 'samples': 724032, 'steps': 3770, 'loss/train': 1.7649283409118652}} +11/06/2021 21:47:36 - INFO - __main__ - Step 3778: {'lr': 0.0004998221680917004, 'samples': 725376, 'steps': 3777, 'loss/train': 2.202800989151001}}} +11/06/2021 21:47:36 - INFO - __main__ - Step 3778: {'lr': 0.0004998221680917004, 'samples': 725376, 'steps': 3777, 'loss/train': 2.202800989151001}}} +11/06/2021 21:47:40 - INFO - __main__ - Step 3786: {'lr': 0.0004998205634917566, 'samples': 726912, 'steps': 3785, 'loss/train': 2.1383769512176514}} +11/06/2021 21:47:42 - INFO - __main__ - Step 3791: {'lr': 0.0004998195569584168, 'samples': 727872, 'steps': 3790, 'loss/train': 2.279456377029419}}} +11/06/2021 21:47:45 - INFO - __main__ - Step 3796: {'lr': 0.000499818547610956, 'samples': 728832, 'steps': 3795, 'loss/train': 1.8099079132080078}}} +11/06/2021 21:47:45 - INFO - __main__ - Step 3796: {'lr': 0.000499818547610956, 'samples': 728832, 'steps': 3795, 'loss/train': 1.8099079132080078}}} +11/06/2021 21:47:48 - INFO - __main__ - Step 3803: {'lr': 0.0004998171297968095, 'samples': 730176, 'steps': 3802, 'loss/train': 2.3628175258636475}} +11/06/2021 21:47:50 - INFO - __main__ - Step 3807: {'lr': 0.0004998163171408928, 'samples': 730944, 'steps': 3806, 'loss/train': 2.0892038345336914}} +11/06/2021 21:47:50 - INFO - __main__ - Step 3807: {'lr': 0.0004998163171408928, 'samples': 730944, 'steps': 3806, 'loss/train': 2.0892038345336914}} +11/06/2021 21:47:55 - INFO - __main__ - Step 3815: {'lr': 0.0004998146864260231, 'samples': 732480, 'steps': 3814, 'loss/train': 2.178349733352661}}} +11/06/2021 21:47:56 - INFO - __main__ - Step 3819: {'lr': 0.000499813868367082, 'samples': 733248, 'steps': 3818, 'loss/train': 1.899258017539978}}}} +11/06/2021 21:47:58 - INFO - __main__ - Step 3823: {'lr': 0.0004998130485071444, 'samples': 734016, 'steps': 3822, 'loss/train': 2.2223479747772217}} +11/06/2021 21:48:00 - INFO - __main__ - Step 3828: {'lr': 0.0004998120211495803, 'samples': 734976, 'steps': 3827, 'loss/train': 1.8643083572387695}} +11/06/2021 21:48:00 - INFO - __main__ - Step 3828: {'lr': 0.0004998120211495803, 'samples': 734976, 'steps': 3827, 'loss/train': 1.8643083572387695}} +11/06/2021 21:48:05 - INFO - __main__ - Step 3836: {'lr': 0.0004998103715242875, 'samples': 736512, 'steps': 3835, 'loss/train': 2.376988649368286}}} +11/06/2021 21:48:06 - INFO - __main__ - Step 3840: {'lr': 0.0004998095440101815, 'samples': 737280, 'steps': 3839, 'loss/train': 2.203437089920044}}} +11/06/2021 21:48:08 - INFO - __main__ - Step 3844: {'lr': 0.0004998087146951101, 'samples': 738048, 'steps': 3843, 'loss/train': 0.9520333409309387}} +11/06/2021 21:48:11 - INFO - __main__ - Step 3849: {'lr': 0.0004998076755186727, 'samples': 739008, 'steps': 3848, 'loss/train': 1.7136802673339844}} +11/06/2021 21:48:13 - INFO - __main__ - Step 3854: {'lr': 0.0004998066335282483, 'samples': 739968, 'steps': 3853, 'loss/train': 1.9457613229751587}} +11/06/2021 21:48:13 - INFO - __main__ - Step 3854: {'lr': 0.0004998066335282483, 'samples': 739968, 'steps': 3853, 'loss/train': 1.9457613229751587}} +11/06/2021 21:48:16 - INFO - __main__ - Step 3860: {'lr': 0.0004998053794252925, 'samples': 741120, 'steps': 3859, 'loss/train': 1.1343226432800293}} +11/06/2021 21:48:18 - INFO - __main__ - Step 3865: {'lr': 0.0004998043312441378, 'samples': 742080, 'steps': 3864, 'loss/train': 2.002265214920044}}} +11/06/2021 21:48:18 - INFO - __main__ - Step 3865: {'lr': 0.0004998043312441378, 'samples': 742080, 'steps': 3864, 'loss/train': 2.002265214920044}}} +11/06/2021 21:48:22 - INFO - __main__ - Step 3873: {'lr': 0.0004998026483012803, 'samples': 743616, 'steps': 3872, 'loss/train': 0.3874906599521637}} +11/06/2021 21:48:22 - INFO - __main__ - Step 3873: {'lr': 0.0004998026483012803, 'samples': 743616, 'steps': 3872, 'loss/train': 0.3874906599521637}} +11/06/2021 21:48:26 - INFO - __main__ - Step 3880: {'lr': 0.0004998011698170245, 'samples': 744960, 'steps': 3879, 'loss/train': 2.270320415496826}}} +11/06/2021 21:48:26 - INFO - __main__ - Step 3880: {'lr': 0.0004998011698170245, 'samples': 744960, 'steps': 3879, 'loss/train': 2.270320415496826}}} +11/06/2021 21:48:30 - INFO - __main__ - Step 3888: {'lr': 0.0004997994733673409, 'samples': 746496, 'steps': 3887, 'loss/train': 2.0216381549835205}} +11/06/2021 21:48:32 - INFO - __main__ - Step 3892: {'lr': 0.0004997986224411571, 'samples': 747264, 'steps': 3891, 'loss/train': 1.900480031967163}}} +11/06/2021 21:48:34 - INFO - __main__ - Step 3897: {'lr': 0.0004997975562509315, 'samples': 748224, 'steps': 3896, 'loss/train': 1.9882245063781738}} +11/06/2021 21:48:37 - INFO - __main__ - Step 3902: {'lr': 0.0004997964872468327, 'samples': 749184, 'steps': 3901, 'loss/train': 2.4843428134918213}} +11/06/2021 21:48:39 - INFO - __main__ - Step 3906: {'lr': 0.0004997956300175732, 'samples': 749952, 'steps': 3905, 'loss/train': 2.6430604457855225}} +11/06/2021 21:48:39 - INFO - __main__ - Step 3906: {'lr': 0.0004997956300175732, 'samples': 749952, 'steps': 3905, 'loss/train': 2.6430604457855225}} +11/06/2021 21:48:42 - INFO - __main__ - Step 3913: {'lr': 0.0004997941255330416, 'samples': 751296, 'steps': 3912, 'loss/train': 1.9108836650848389}} +11/06/2021 21:48:44 - INFO - __main__ - Step 3918: {'lr': 0.00049979304752463, 'samples': 752256, 'steps': 3917, 'loss/train': 1.5085346698760986}9}} +11/06/2021 21:48:47 - INFO - __main__ - Step 3923: {'lr': 0.0004997919667023962, 'samples': 753216, 'steps': 3922, 'loss/train': 6.834549903869629}}} +11/06/2021 21:48:47 - INFO - __main__ - Step 3923: {'lr': 0.0004997919667023962, 'samples': 753216, 'steps': 3922, 'loss/train': 6.834549903869629}}} +11/06/2021 21:48:50 - INFO - __main__ - Step 3930: {'lr': 0.0004997904488240704, 'samples': 754560, 'steps': 3929, 'loss/train': 1.9056246280670166}} +11/06/2021 21:48:52 - INFO - __main__ - Step 3934: {'lr': 0.000499789578988887, 'samples': 755328, 'steps': 3933, 'loss/train': 2.532392740249634}6}} +11/06/2021 21:48:54 - INFO - __main__ - Step 3939: {'lr': 0.0004997884891625037, 'samples': 756288, 'steps': 3938, 'loss/train': 2.200429916381836}}} +11/06/2021 21:48:57 - INFO - __main__ - Step 3944: {'lr': 0.0004997873965223495, 'samples': 757248, 'steps': 3943, 'loss/train': 2.6807804107666016}} +11/06/2021 21:48:57 - INFO - __main__ - Step 3944: {'lr': 0.0004997873965223495, 'samples': 757248, 'steps': 3943, 'loss/train': 2.6807804107666016}} +11/06/2021 21:49:00 - INFO - __main__ - Step 3951: {'lr': 0.0004997858620990217, 'samples': 758592, 'steps': 3950, 'loss/train': 1.9574391841888428}} +11/06/2021 21:49:02 - INFO - __main__ - Step 3955: {'lr': 0.0004997849828095969, 'samples': 759360, 'steps': 3954, 'loss/train': 2.0461413860321045}} +11/06/2021 21:49:05 - INFO - __main__ - Step 3960: {'lr': 0.0004997838811654584, 'samples': 760320, 'steps': 3959, 'loss/train': 2.6631009578704834}} +11/06/2021 21:49:07 - INFO - __main__ - Step 3964: {'lr': 0.0004997829978242693, 'samples': 761088, 'steps': 3963, 'loss/train': 1.9565014839172363}} +11/06/2021 21:49:09 - INFO - __main__ - Step 3968: {'lr': 0.0004997821126823062, 'samples': 761856, 'steps': 3967, 'loss/train': 2.048008680343628}}} +11/06/2021 21:49:10 - INFO - __main__ - Step 3972: {'lr': 0.0004997812257395758, 'samples': 762624, 'steps': 3971, 'loss/train': 0.8743030428886414}} +11/06/2021 21:49:12 - INFO - __main__ - Step 3976: {'lr': 0.0004997803369960844, 'samples': 763392, 'steps': 3975, 'loss/train': 1.4740993976593018}} +11/06/2021 21:49:15 - INFO - __main__ - Step 3981: {'lr': 0.0004997792235344096, 'samples': 764352, 'steps': 3980, 'loss/train': 2.1326520442962646}} +11/06/2021 21:49:17 - INFO - __main__ - Step 3985: {'lr': 0.0004997783307392292, 'samples': 765120, 'steps': 3984, 'loss/train': 1.8312244415283203}} +11/06/2021 21:49:19 - INFO - __main__ - Step 3989: {'lr': 0.0004997774361433086, 'samples': 765888, 'steps': 3988, 'loss/train': 2.3569905757904053}} +11/06/2021 21:49:19 - INFO - __main__ - Step 3989: {'lr': 0.0004997774361433086, 'samples': 765888, 'steps': 3988, 'loss/train': 2.3569905757904053}} +11/06/2021 21:49:22 - INFO - __main__ - Step 3996: {'lr': 0.000499775866267436, 'samples': 767232, 'steps': 3995, 'loss/train': 2.0774638652801514}}} +11/06/2021 21:49:25 - INFO - __main__ - Step 4001: {'lr': 0.0004997747415511704, 'samples': 768192, 'steps': 4000, 'loss/train': 2.3865301609039307}} +11/06/2021 21:49:27 - INFO - __main__ - Step 4005: {'lr': 0.0004997738397523537, 'samples': 768960, 'steps': 4004, 'loss/train': 2.0718185901641846}} +11/06/2021 21:49:29 - INFO - __main__ - Step 4009: {'lr': 0.0004997729361528292, 'samples': 769728, 'steps': 4008, 'loss/train': 2.3731486797332764}} +11/06/2021 21:49:30 - INFO - __main__ - Step 4013: {'lr': 0.0004997720307526034, 'samples': 770496, 'steps': 4012, 'loss/train': 2.1763927936553955}} +11/06/2021 21:49:32 - INFO - __main__ - Step 4017: {'lr': 0.0004997711235516829, 'samples': 771264, 'steps': 4016, 'loss/train': 1.86122727394104}5}} +11/06/2021 21:49:35 - INFO - __main__ - Step 4022: {'lr': 0.0004997699870183151, 'samples': 772224, 'steps': 4021, 'loss/train': 2.2087340354919434}} +11/06/2021 21:49:37 - INFO - __main__ - Step 4026: {'lr': 0.0004997690757658552, 'samples': 772992, 'steps': 4025, 'loss/train': 1.9826215505599976}} +11/06/2021 21:49:39 - INFO - __main__ - Step 4030: {'lr': 0.000499768162712722, 'samples': 773760, 'steps': 4029, 'loss/train': 2.1849615573883057}}} +11/06/2021 21:49:40 - INFO - __main__ - Step 4034: {'lr': 0.0004997672478589219, 'samples': 774528, 'steps': 4033, 'loss/train': 1.615881085395813}}} +11/06/2021 21:49:42 - INFO - __main__ - Step 4038: {'lr': 0.0004997663312044614, 'samples': 775296, 'steps': 4037, 'loss/train': 1.8073010444641113}} +11/06/2021 21:49:45 - INFO - __main__ - Step 4043: {'lr': 0.0004997651828542173, 'samples': 776256, 'steps': 4042, 'loss/train': 2.349440336227417}}} +11/06/2021 21:49:47 - INFO - __main__ - Step 4047: {'lr': 0.0004997642621482955, 'samples': 777024, 'steps': 4046, 'loss/train': 3.536803960800171}}} +11/06/2021 21:49:49 - INFO - __main__ - Step 4051: {'lr': 0.0004997633396417348, 'samples': 777792, 'steps': 4050, 'loss/train': 2.1511425971984863}} +11/06/2021 21:49:51 - INFO - __main__ - Step 4055: {'lr': 0.000499762415334542, 'samples': 778560, 'steps': 4054, 'loss/train': 1.871009111404419}3}} +11/06/2021 21:49:52 - INFO - __main__ - Step 4059: {'lr': 0.0004997614892267238, 'samples': 779328, 'steps': 4058, 'loss/train': 1.7731740474700928}} +11/06/2021 21:49:55 - INFO - __main__ - Step 4064: {'lr': 0.0004997603290598317, 'samples': 780288, 'steps': 4063, 'loss/train': 1.8180835247039795}} +11/06/2021 21:49:57 - INFO - __main__ - Step 4068: {'lr': 0.0004997593989006306, 'samples': 781056, 'steps': 4067, 'loss/train': 1.7563910484313965}} +11/06/2021 21:49:57 - INFO - __main__ - Step 4068: {'lr': 0.0004997593989006306, 'samples': 781056, 'steps': 4067, 'loss/train': 1.7563910484313965}} +11/06/2021 21:50:00 - INFO - __main__ - Step 4074: {'lr': 0.0004997580002856993, 'samples': 782208, 'steps': 4073, 'loss/train': 2.6347973346710205}} +11/06/2021 21:50:02 - INFO - __main__ - Step 4079: {'lr': 0.0004997568316784852, 'samples': 783168, 'steps': 4078, 'loss/train': 2.6030142307281494}} +11/06/2021 21:50:02 - INFO - __main__ - Step 4079: {'lr': 0.0004997568316784852, 'samples': 783168, 'steps': 4078, 'loss/train': 2.6030142307281494}} +11/06/2021 21:50:07 - INFO - __main__ - Step 4087: {'lr': 0.0004997549560550464, 'samples': 784704, 'steps': 4086, 'loss/train': 2.3296737670898438}} +11/06/2021 21:50:08 - INFO - __main__ - Step 4091: {'lr': 0.000499754015542466, 'samples': 785472, 'steps': 4090, 'loss/train': 2.175802707672119}8}} +11/06/2021 21:50:10 - INFO - __main__ - Step 4095: {'lr': 0.0004997530732293209, 'samples': 786240, 'steps': 4094, 'loss/train': 1.8951164484024048}} +11/06/2021 21:50:13 - INFO - __main__ - Step 4100: {'lr': 0.0004997518928058553, 'samples': 787200, 'steps': 4099, 'loss/train': 1.9039506912231445}} +11/06/2021 21:50:15 - INFO - __main__ - Step 4104: {'lr': 0.0004997509464414639, 'samples': 787968, 'steps': 4103, 'loss/train': 1.8288829326629639}} +11/06/2021 21:50:17 - INFO - __main__ - Step 4108: {'lr': 0.0004997499982765299, 'samples': 788736, 'steps': 4107, 'loss/train': 2.3028995990753174}} +11/06/2021 21:50:17 - INFO - __main__ - Step 4108: {'lr': 0.0004997499982765299, 'samples': 788736, 'steps': 4107, 'loss/train': 2.3028995990753174}} +11/06/2021 21:50:20 - INFO - __main__ - Step 4115: {'lr': 0.0004997483346553597, 'samples': 790080, 'steps': 4114, 'loss/train': 2.204193592071533}}} +11/06/2021 21:50:23 - INFO - __main__ - Step 4120: {'lr': 0.0004997471429785394, 'samples': 791040, 'steps': 4119, 'loss/train': 2.340329170227051}}} +11/06/2021 21:50:25 - INFO - __main__ - Step 4125: {'lr': 0.0004997459484884139, 'samples': 792000, 'steps': 4124, 'loss/train': 2.5181665420532227}} +11/06/2021 21:50:27 - INFO - __main__ - Step 4129: {'lr': 0.0004997449908707428, 'samples': 792768, 'steps': 4128, 'loss/train': 1.6142773628234863}} +11/06/2021 21:50:29 - INFO - __main__ - Step 4133: {'lr': 0.0004997440314525718, 'samples': 793536, 'steps': 4132, 'loss/train': 1.7447444200515747}} +11/06/2021 21:50:30 - INFO - __main__ - Step 4137: {'lr': 0.000499743070233908, 'samples': 794304, 'steps': 4136, 'loss/train': 2.2369892597198486}}} +11/06/2021 21:50:33 - INFO - __main__ - Step 4141: {'lr': 0.0004997421072147581, 'samples': 795072, 'steps': 4140, 'loss/train': 2.0105512142181396}} +11/06/2021 21:50:35 - INFO - __main__ - Step 4146: {'lr': 0.0004997409009088979, 'samples': 796032, 'steps': 4145, 'loss/train': 2.225456476211548}}} +11/06/2021 21:50:35 - INFO - __main__ - Step 4146: {'lr': 0.0004997409009088979, 'samples': 796032, 'steps': 4145, 'loss/train': 2.225456476211548}}} +11/06/2021 21:50:39 - INFO - __main__ - Step 4154: {'lr': 0.0004997389649679987, 'samples': 797568, 'steps': 4153, 'loss/train': 1.9823795557022095}} +11/06/2021 21:50:41 - INFO - __main__ - Step 4158: {'lr': 0.0004997379942968611, 'samples': 798336, 'steps': 4157, 'loss/train': 2.2602744102478027}} +11/06/2021 21:50:42 - INFO - __main__ - Step 4162: {'lr': 0.0004997370218252741, 'samples': 799104, 'steps': 4161, 'loss/train': 1.6607433557510376}} +11/06/2021 21:50:45 - INFO - __main__ - Step 4166: {'lr': 0.0004997360475532447, 'samples': 799872, 'steps': 4165, 'loss/train': 2.014327049255371}}} +11/06/2021 21:50:47 - INFO - __main__ - Step 4171: {'lr': 0.0004997348271813466, 'samples': 800832, 'steps': 4170, 'loss/train': 2.2488949298858643}} +11/06/2021 21:50:47 - INFO - __main__ - Step 4171: {'lr': 0.0004997348271813466, 'samples': 800832, 'steps': 4170, 'loss/train': 2.2488949298858643}} +11/06/2021 21:50:51 - INFO - __main__ - Step 4179: {'lr': 0.000499732868734929, 'samples': 802368, 'steps': 4178, 'loss/train': 1.4197605848312378}}} +11/06/2021 21:50:53 - INFO - __main__ - Step 4183: {'lr': 0.0004997318868110981, 'samples': 803136, 'steps': 4182, 'loss/train': 2.6250104904174805}} +11/06/2021 21:50:55 - INFO - __main__ - Step 4187: {'lr': 0.0004997309030868617, 'samples': 803904, 'steps': 4186, 'loss/train': 1.2969268560409546}} +11/06/2021 21:50:57 - INFO - __main__ - Step 4192: {'lr': 0.000499729670899757, 'samples': 804864, 'steps': 4191, 'loss/train': 2.5529255867004395}}} +11/06/2021 21:50:57 - INFO - __main__ - Step 4192: {'lr': 0.000499729670899757, 'samples': 804864, 'steps': 4191, 'loss/train': 2.5529255867004395}}} +11/06/2021 21:51:01 - INFO - __main__ - Step 4199: {'lr': 0.0004997279411117916, 'samples': 806208, 'steps': 4198, 'loss/train': 0.3961840569972992}} +11/06/2021 21:51:03 - INFO - __main__ - Step 4203: {'lr': 0.000499726950186005, 'samples': 806976, 'steps': 4202, 'loss/train': 2.567746639251709}2}} +11/06/2021 21:51:05 - INFO - __main__ - Step 4208: {'lr': 0.0004997257089970024, 'samples': 807936, 'steps': 4207, 'loss/train': 2.0918617248535156}} +11/06/2021 21:51:07 - INFO - __main__ - Step 4212: {'lr': 0.0004997247140203939, 'samples': 808704, 'steps': 4211, 'loss/train': 2.0272629261016846}} +11/06/2021 21:51:09 - INFO - __main__ - Step 4216: {'lr': 0.0004997237172434316, 'samples': 809472, 'steps': 4215, 'loss/train': 1.893647313117981}}} +11/06/2021 21:51:09 - INFO - __main__ - Step 4216: {'lr': 0.0004997237172434316, 'samples': 809472, 'steps': 4215, 'loss/train': 1.893647313117981}}} +11/06/2021 21:51:13 - INFO - __main__ - Step 4223: {'lr': 0.0004997219685516684, 'samples': 810816, 'steps': 4222, 'loss/train': 2.0050837993621826}} +11/06/2021 21:51:15 - INFO - __main__ - Step 4228: {'lr': 0.0004997207161104951, 'samples': 811776, 'steps': 4227, 'loss/train': 2.2613799571990967}} +11/06/2021 21:51:15 - INFO - __main__ - Step 4228: {'lr': 0.0004997207161104951, 'samples': 811776, 'steps': 4227, 'loss/train': 2.2613799571990967}} +11/06/2021 21:51:19 - INFO - __main__ - Step 4236: {'lr': 0.0004997187063535679, 'samples': 813312, 'steps': 4235, 'loss/train': 2.289562463760376}}} +11/06/2021 21:51:21 - INFO - __main__ - Step 4240: {'lr': 0.0004997176987746352, 'samples': 814080, 'steps': 4239, 'loss/train': 2.1802866458892822}} +11/06/2021 21:51:21 - INFO - __main__ - Step 4240: {'lr': 0.0004997176987746352, 'samples': 814080, 'steps': 4239, 'loss/train': 2.1802866458892822}} +11/06/2021 21:51:25 - INFO - __main__ - Step 4248: {'lr': 0.0004997156782158679, 'samples': 815616, 'steps': 4247, 'loss/train': 2.169619083404541}}} +11/06/2021 21:51:27 - INFO - __main__ - Step 4252: {'lr': 0.0004997146652360478, 'samples': 816384, 'steps': 4251, 'loss/train': 1.8407737016677856}} +11/06/2021 21:51:29 - INFO - __main__ - Step 4256: {'lr': 0.0004997136504559465, 'samples': 817152, 'steps': 4255, 'loss/train': 1.9230844974517822}} +11/06/2021 21:51:31 - INFO - __main__ - Step 4260: {'lr': 0.0004997126338755714, 'samples': 817920, 'steps': 4259, 'loss/train': 2.247880697250366}}} +11/06/2021 21:51:31 - INFO - __main__ - Step 4260: {'lr': 0.0004997126338755714, 'samples': 817920, 'steps': 4259, 'loss/train': 2.247880697250366}}} +11/06/2021 21:51:35 - INFO - __main__ - Step 4268: {'lr': 0.0004997105953140288, 'samples': 819456, 'steps': 4267, 'loss/train': 1.6954803466796875}} +11/06/2021 21:51:37 - INFO - __main__ - Step 4272: {'lr': 0.0004997095733328761, 'samples': 820224, 'steps': 4271, 'loss/train': 2.232881784439087}}} +11/06/2021 21:51:39 - INFO - __main__ - Step 4276: {'lr': 0.0004997085495514788, 'samples': 820992, 'steps': 4275, 'loss/train': 2.0807552337646484}} +11/06/2021 21:51:41 - INFO - __main__ - Step 4281: {'lr': 0.0004997072672931497, 'samples': 821952, 'steps': 4280, 'loss/train': 2.4467787742614746}} +11/06/2021 21:51:44 - INFO - __main__ - Step 4285: {'lr': 0.0004997062394612293, 'samples': 822720, 'steps': 4284, 'loss/train': 2.1867868900299072}} +11/06/2021 21:51:46 - INFO - __main__ - Step 4289: {'lr': 0.0004997052098290886, 'samples': 823488, 'steps': 4288, 'loss/train': 2.015610694885254}}} +11/06/2021 21:51:47 - INFO - __main__ - Step 4293: {'lr': 0.0004997041783967348, 'samples': 824256, 'steps': 4292, 'loss/train': 2.276956558227539}}} +11/06/2021 21:51:49 - INFO - __main__ - Step 4297: {'lr': 0.0004997031451641754, 'samples': 825024, 'steps': 4296, 'loss/train': 1.8525234460830688}} +11/06/2021 21:51:52 - INFO - __main__ - Step 4302: {'lr': 0.0004997018510919483, 'samples': 825984, 'steps': 4301, 'loss/train': 1.1239334344863892}} +11/06/2021 21:51:54 - INFO - __main__ - Step 4306: {'lr': 0.0004997008138089536, 'samples': 826752, 'steps': 4305, 'loss/train': 2.289822816848755}}} +11/06/2021 21:51:56 - INFO - __main__ - Step 4310: {'lr': 0.0004996997747257775, 'samples': 827520, 'steps': 4309, 'loss/train': 2.347663640975952}}} +11/06/2021 21:51:57 - INFO - __main__ - Step 4314: {'lr': 0.0004996987338424276, 'samples': 828288, 'steps': 4313, 'loss/train': 2.120884418487549}}} +11/06/2021 21:51:59 - INFO - __main__ - Step 4318: {'lr': 0.0004996976911589114, 'samples': 829056, 'steps': 4317, 'loss/train': 1.8161555528640747}} +11/06/2021 21:52:02 - INFO - __main__ - Step 4323: {'lr': 0.0004996963852730436, 'samples': 830016, 'steps': 4322, 'loss/train': 1.9152145385742188}} +11/06/2021 21:52:04 - INFO - __main__ - Step 4327: {'lr': 0.0004996953385391806, 'samples': 830784, 'steps': 4326, 'loss/train': 2.2413148880004883}} +11/06/2021 21:52:04 - INFO - __main__ - Step 4327: {'lr': 0.0004996953385391806, 'samples': 830784, 'steps': 4326, 'loss/train': 2.2413148880004883}} +11/06/2021 21:52:07 - INFO - __main__ - Step 4334: {'lr': 0.0004996935024233335, 'samples': 832128, 'steps': 4333, 'loss/train': 2.192603349685669}}} +11/06/2021 21:52:09 - INFO - __main__ - Step 4338: {'lr': 0.0004996924507390985, 'samples': 832896, 'steps': 4337, 'loss/train': 2.24872088432312}}}} +11/06/2021 21:52:12 - INFO - __main__ - Step 4344: {'lr': 0.0004996908698375216, 'samples': 834048, 'steps': 4343, 'loss/train': 1.9386653900146484}} +11/06/2021 21:52:14 - INFO - __main__ - Step 4348: {'lr': 0.0004996898136529982, 'samples': 834816, 'steps': 4347, 'loss/train': 2.482868194580078}}} +11/06/2021 21:52:16 - INFO - __main__ - Step 4352: {'lr': 0.0004996887556683729, 'samples': 835584, 'steps': 4351, 'loss/train': 2.027623414993286}}} +11/06/2021 21:52:16 - INFO - __main__ - Step 4352: {'lr': 0.0004996887556683729, 'samples': 835584, 'steps': 4351, 'loss/train': 2.027623414993286}}} +11/06/2021 21:52:19 - INFO - __main__ - Step 4359: {'lr': 0.0004996868998638059, 'samples': 836928, 'steps': 4358, 'loss/train': 2.3234333992004395}} +11/06/2021 21:52:22 - INFO - __main__ - Step 4364: {'lr': 0.000499685570913961, 'samples': 837888, 'steps': 4363, 'loss/train': 1.978306770324707}5}} +11/06/2021 21:52:24 - INFO - __main__ - Step 4368: {'lr': 0.0004996845057290039, 'samples': 838656, 'steps': 4367, 'loss/train': 2.1156513690948486}} +11/06/2021 21:52:25 - INFO - __main__ - Step 4372: {'lr': 0.0004996834387439831, 'samples': 839424, 'steps': 4371, 'loss/train': 2.4186854362487793}} +11/06/2021 21:52:27 - INFO - __main__ - Step 4376: {'lr': 0.0004996823699589062, 'samples': 840192, 'steps': 4375, 'loss/train': 2.005566120147705}}} +11/06/2021 21:52:30 - INFO - __main__ - Step 4381: {'lr': 0.0004996810314462429, 'samples': 841152, 'steps': 4380, 'loss/train': 1.7387698888778687}} +11/06/2021 21:52:32 - INFO - __main__ - Step 4385: {'lr': 0.0004996799586110681, 'samples': 841920, 'steps': 4384, 'loss/train': 2.161149501800537}}} +11/06/2021 21:52:34 - INFO - __main__ - Step 4389: {'lr': 0.0004996788839758622, 'samples': 842688, 'steps': 4388, 'loss/train': 2.4196763038635254}} +11/06/2021 21:52:35 - INFO - __main__ - Step 4393: {'lr': 0.0004996778075406331, 'samples': 843456, 'steps': 4392, 'loss/train': 1.8474143743515015}} +11/06/2021 21:52:37 - INFO - __main__ - Step 4397: {'lr': 0.0004996767293053885, 'samples': 844224, 'steps': 4396, 'loss/train': 1.8675569295883179}} +11/06/2021 21:52:40 - INFO - __main__ - Step 4402: {'lr': 0.0004996753789800729, 'samples': 845184, 'steps': 4401, 'loss/train': 2.3262462615966797}} +11/06/2021 21:52:42 - INFO - __main__ - Step 4406: {'lr': 0.0004996742966948219, 'samples': 845952, 'steps': 4405, 'loss/train': 1.8191969394683838}} +11/06/2021 21:52:44 - INFO - __main__ - Step 4410: {'lr': 0.0004996732126095807, 'samples': 846720, 'steps': 4409, 'loss/train': 1.7854758501052856}} +11/06/2021 21:52:44 - INFO - __main__ - Step 4410: {'lr': 0.0004996732126095807, 'samples': 846720, 'steps': 4409, 'loss/train': 1.7854758501052856}} +11/06/2021 21:52:47 - INFO - __main__ - Step 4417: {'lr': 0.000499671311129206, 'samples': 848064, 'steps': 4416, 'loss/train': 1.7873398065567017}}} +11/06/2021 21:52:50 - INFO - __main__ - Step 4422: {'lr': 0.0004996699495539947, 'samples': 849024, 'steps': 4421, 'loss/train': 2.1597673892974854}} +11/06/2021 21:52:52 - INFO - __main__ - Step 4427: {'lr': 0.0004996685851663477, 'samples': 849984, 'steps': 4426, 'loss/train': 2.1259970664978027}} +11/06/2021 21:52:54 - INFO - __main__ - Step 4431: {'lr': 0.0004996674916312867, 'samples': 850752, 'steps': 4430, 'loss/train': 2.205284595489502}}} +11/06/2021 21:52:54 - INFO - __main__ - Step 4431: {'lr': 0.0004996674916312867, 'samples': 850752, 'steps': 4430, 'loss/train': 2.205284595489502}}} +11/06/2021 21:52:57 - INFO - __main__ - Step 4438: {'lr': 0.0004996655736138265, 'samples': 852096, 'steps': 4437, 'loss/train': 2.149383783340454}}} +11/06/2021 21:52:57 - INFO - __main__ - Step 4438: {'lr': 0.0004996655736138265, 'samples': 852096, 'steps': 4437, 'loss/train': 2.149383783340454}}} +11/06/2021 21:53:01 - INFO - __main__ - Step 4446: {'lr': 0.0004996633748441472, 'samples': 853632, 'steps': 4445, 'loss/train': 2.116128444671631}}} +11/06/2021 21:53:04 - INFO - __main__ - Step 4450: {'lr': 0.0004996622727594363, 'samples': 854400, 'steps': 4449, 'loss/train': 1.287934422492981}}} +11/06/2021 21:53:06 - INFO - __main__ - Step 4455: {'lr': 0.0004996608926224345, 'samples': 855360, 'steps': 4454, 'loss/train': 2.0416908264160156}} +11/06/2021 21:53:08 - INFO - __main__ - Step 4459: {'lr': 0.0004996597864879521, 'samples': 856128, 'steps': 4458, 'loss/train': 2.2517218589782715}} +11/06/2021 21:53:10 - INFO - __main__ - Step 4463: {'lr': 0.0004996586785535841, 'samples': 856896, 'steps': 4462, 'loss/train': 2.0258359909057617}} +11/06/2021 21:53:12 - INFO - __main__ - Step 4467: {'lr': 0.0004996575688193386, 'samples': 857664, 'steps': 4466, 'loss/train': 1.737178087234497}}} +11/06/2021 21:53:14 - INFO - __main__ - Step 4471: {'lr': 0.0004996564572852235, 'samples': 858432, 'steps': 4470, 'loss/train': 2.0802853107452393}} +11/06/2021 21:53:14 - INFO - __main__ - Step 4471: {'lr': 0.0004996564572852235, 'samples': 858432, 'steps': 4470, 'loss/train': 2.0802853107452393}} +11/06/2021 21:53:18 - INFO - __main__ - Step 4479: {'lr': 0.0004996542288174166, 'samples': 859968, 'steps': 4478, 'loss/train': 2.4320411682128906}} +11/06/2021 21:53:19 - INFO - __main__ - Step 4483: {'lr': 0.000499653111883741, 'samples': 860736, 'steps': 4482, 'loss/train': 2.1700544357299805}}} +11/06/2021 21:53:21 - INFO - __main__ - Step 4487: {'lr': 0.0004996519931502279, 'samples': 861504, 'steps': 4486, 'loss/train': 2.3324050903320312}} +11/06/2021 21:53:24 - INFO - __main__ - Step 4492: {'lr': 0.0004996505922023274, 'samples': 862464, 'steps': 4491, 'loss/train': 2.6008143424987793}} +11/06/2021 21:53:26 - INFO - __main__ - Step 4497: {'lr': 0.0004996491884422092, 'samples': 863424, 'steps': 4496, 'loss/train': 2.276155948638916}}} +11/06/2021 21:53:28 - INFO - __main__ - Step 4501: {'lr': 0.0004996480634093287, 'samples': 864192, 'steps': 4500, 'loss/train': 1.751892328262329}}} +11/06/2021 21:53:30 - INFO - __main__ - Step 4505: {'lr': 0.0004996469365766471, 'samples': 864960, 'steps': 4504, 'loss/train': 1.7238401174545288}} +11/06/2021 21:53:32 - INFO - __main__ - Step 4509: {'lr': 0.0004996458079441727, 'samples': 865728, 'steps': 4508, 'loss/train': 1.8585339784622192}} +11/06/2021 21:53:34 - INFO - __main__ - Step 4513: {'lr': 0.0004996446775119134, 'samples': 866496, 'steps': 4512, 'loss/train': 1.8141558170318604}} +11/06/2021 21:53:36 - INFO - __main__ - Step 4517: {'lr': 0.0004996435452798775, 'samples': 867264, 'steps': 4516, 'loss/train': 1.8776859045028687}} +11/06/2021 21:53:38 - INFO - __main__ - Step 4522: {'lr': 0.0004996421274589091, 'samples': 868224, 'steps': 4521, 'loss/train': 2.311401128768921}}} +11/06/2021 21:53:40 - INFO - __main__ - Step 4526: {'lr': 0.0004996409911774056, 'samples': 868992, 'steps': 4525, 'loss/train': 1.9752427339553833}} +11/06/2021 21:53:40 - INFO - __main__ - Step 4526: {'lr': 0.0004996409911774056, 'samples': 868992, 'steps': 4525, 'loss/train': 1.9752427339553833}} +11/06/2021 21:53:44 - INFO - __main__ - Step 4533: {'lr': 0.000499638998354131, 'samples': 870336, 'steps': 4532, 'loss/train': 2.118048667907715}3}} +11/06/2021 21:53:46 - INFO - __main__ - Step 4538: {'lr': 0.0004996375715344278, 'samples': 871296, 'steps': 4537, 'loss/train': 2.1683661937713623}} +11/06/2021 21:53:46 - INFO - __main__ - Step 4538: {'lr': 0.0004996375715344278, 'samples': 871296, 'steps': 4537, 'loss/train': 2.1683661937713623}} +11/06/2021 21:53:49 - INFO - __main__ - Step 4545: {'lr': 0.0004996355692625678, 'samples': 872640, 'steps': 4544, 'loss/train': 2.3875391483306885}} +11/06/2021 21:53:51 - INFO - __main__ - Step 4549: {'lr': 0.0004996344226326137, 'samples': 873408, 'steps': 4548, 'loss/train': 2.1202685832977295}} +11/06/2021 21:53:54 - INFO - __main__ - Step 4554: {'lr': 0.0004996329868143404, 'samples': 874368, 'steps': 4553, 'loss/train': 2.062023639678955}}} +11/06/2021 21:53:54 - INFO - __main__ - Step 4554: {'lr': 0.0004996329868143404, 'samples': 874368, 'steps': 4553, 'loss/train': 2.062023639678955}}} +11/06/2021 21:53:58 - INFO - __main__ - Step 4562: {'lr': 0.0004996306836561094, 'samples': 875904, 'steps': 4561, 'loss/train': 2.1488685607910156}} +11/06/2021 21:53:59 - INFO - __main__ - Step 4566: {'lr': 0.0004996295293774762, 'samples': 876672, 'steps': 4565, 'loss/train': 2.0341947078704834}} +11/06/2021 21:54:01 - INFO - __main__ - Step 4570: {'lr': 0.0004996283732991755, 'samples': 877440, 'steps': 4569, 'loss/train': 2.2277791500091553}} +11/06/2021 21:54:04 - INFO - __main__ - Step 4575: {'lr': 0.0004996269256705301, 'samples': 878400, 'steps': 4574, 'loss/train': 2.103940486907959}}} +11/06/2021 21:54:06 - INFO - __main__ - Step 4580: {'lr': 0.0004996254752299337, 'samples': 879360, 'steps': 4579, 'loss/train': 1.8763165473937988}} +11/06/2021 21:54:06 - INFO - __main__ - Step 4580: {'lr': 0.0004996254752299337, 'samples': 879360, 'steps': 4579, 'loss/train': 1.8763165473937988}} +11/06/2021 21:54:10 - INFO - __main__ - Step 4587: {'lr': 0.0004996234398890521, 'samples': 880704, 'steps': 4586, 'loss/train': 1.3432775735855103}} +11/06/2021 21:54:10 - INFO - __main__ - Step 4587: {'lr': 0.0004996234398890521, 'samples': 880704, 'steps': 4586, 'loss/train': 1.3432775735855103}} +11/06/2021 21:54:13 - INFO - __main__ - Step 4595: {'lr': 0.0004996211070366018, 'samples': 882240, 'steps': 4594, 'loss/train': 2.191429376602173}}} +11/06/2021 21:54:13 - INFO - __main__ - Step 4595: {'lr': 0.0004996211070366018, 'samples': 882240, 'steps': 4594, 'loss/train': 2.191429376602173}}} +11/06/2021 21:54:18 - INFO - __main__ - Step 4604: {'lr': 0.0004996184739732291, 'samples': 883968, 'steps': 4603, 'loss/train': 2.1833322048187256}} +11/06/2021 21:54:18 - INFO - __main__ - Step 4604: {'lr': 0.0004996184739732291, 'samples': 883968, 'steps': 4603, 'loss/train': 2.1833322048187256}} +11/06/2021 21:54:21 - INFO - __main__ - Step 4612: {'lr': 0.0004996161258242025, 'samples': 885504, 'steps': 4611, 'loss/train': 2.7224349975585938}} +11/06/2021 21:54:24 - INFO - __main__ - Step 4617: {'lr': 0.0004996146545756786, 'samples': 886464, 'steps': 4616, 'loss/train': 1.9531595706939697}} +11/06/2021 21:54:26 - INFO - __main__ - Step 4621: {'lr': 0.0004996134755523532, 'samples': 887232, 'steps': 4620, 'loss/train': 1.572229027748108}}} +11/06/2021 21:54:28 - INFO - __main__ - Step 4626: {'lr': 0.0004996119992425782, 'samples': 888192, 'steps': 4625, 'loss/train': 2.1612305641174316}} +11/06/2021 21:54:30 - INFO - __main__ - Step 4630: {'lr': 0.0004996108161702736, 'samples': 888960, 'steps': 4629, 'loss/train': 1.8879029750823975}} +11/06/2021 21:54:30 - INFO - __main__ - Step 4630: {'lr': 0.0004996108161702736, 'samples': 888960, 'steps': 4629, 'loss/train': 1.8879029750823975}} +11/06/2021 21:54:33 - INFO - __main__ - Step 4637: {'lr': 0.0004996087414636207, 'samples': 890304, 'steps': 4636, 'loss/train': 1.917240858078003}}} +11/06/2021 21:54:36 - INFO - __main__ - Step 4642: {'lr': 0.000499607256156199, 'samples': 891264, 'steps': 4641, 'loss/train': 1.8053956031799316}}} +11/06/2021 21:54:38 - INFO - __main__ - Step 4647: {'lr': 0.000499605768037048, 'samples': 892224, 'steps': 4646, 'loss/train': 2.353457450866699}}}} +11/06/2021 21:54:38 - INFO - __main__ - Step 4647: {'lr': 0.000499605768037048, 'samples': 892224, 'steps': 4646, 'loss/train': 2.353457450866699}}}} +11/06/2021 21:54:42 - INFO - __main__ - Step 4654: {'lr': 0.000499603679946563, 'samples': 893568, 'steps': 4653, 'loss/train': 2.03910756111145}}}}} +11/06/2021 21:54:44 - INFO - __main__ - Step 4658: {'lr': 0.0004996024842777106, 'samples': 894336, 'steps': 4657, 'loss/train': 1.9979157447814941}} +11/06/2021 21:54:46 - INFO - __main__ - Step 4663: {'lr': 0.0004996009871611382, 'samples': 895296, 'steps': 4662, 'loss/train': 2.1121556758880615}} +11/06/2021 21:54:46 - INFO - __main__ - Step 4663: {'lr': 0.0004996009871611382, 'samples': 895296, 'steps': 4662, 'loss/train': 2.1121556758880615}} +11/06/2021 21:54:50 - INFO - __main__ - Step 4668: {'lr': 0.0004995994872329069, 'samples': 896256, 'steps': 4667, 'loss/train': 2.1744236946105957}} +11/06/2021 21:54:50 - INFO - __main__ - Step 4668: {'lr': 0.0004995994872329069, 'samples': 896256, 'steps': 4667, 'loss/train': 2.1744236946105957}} +11/06/2021 21:54:53 - INFO - __main__ - Step 4676: {'lr': 0.0004995970814995285, 'samples': 897792, 'steps': 4675, 'loss/train': 1.969705581665039}}} +11/06/2021 21:54:56 - INFO - __main__ - Step 4681: {'lr': 0.0004995955742610635, 'samples': 898752, 'steps': 4680, 'loss/train': 1.9930462837219238}} +11/06/2021 21:54:58 - INFO - __main__ - Step 4686: {'lr': 0.0004995940642110005, 'samples': 899712, 'steps': 4685, 'loss/train': 2.056427478790283}}} +11/06/2021 21:54:58 - INFO - __main__ - Step 4686: {'lr': 0.0004995940642110005, 'samples': 899712, 'steps': 4685, 'loss/train': 2.056427478790283}}} +11/06/2021 21:55:01 - INFO - __main__ - Step 4693: {'lr': 0.0004995919454174603, 'samples': 901056, 'steps': 4692, 'loss/train': 2.0533816814422607}} +11/06/2021 21:55:03 - INFO - __main__ - Step 4697: {'lr': 0.0004995907322041214, 'samples': 901824, 'steps': 4696, 'loss/train': 2.322920560836792}}} +11/06/2021 21:55:06 - INFO - __main__ - Step 4702: {'lr': 0.0004995892131570598, 'samples': 902784, 'steps': 4701, 'loss/train': 1.2235736846923828}} +11/06/2021 21:55:06 - INFO - __main__ - Step 4702: {'lr': 0.0004995892131570598, 'samples': 902784, 'steps': 4701, 'loss/train': 1.2235736846923828}} +11/06/2021 21:55:10 - INFO - __main__ - Step 4710: {'lr': 0.0004995867768337938, 'samples': 904320, 'steps': 4709, 'loss/train': 2.073693037033081}}} +11/06/2021 21:55:12 - INFO - __main__ - Step 4714: {'lr': 0.0004995855559731176, 'samples': 905088, 'steps': 4713, 'loss/train': 2.266838550567627}}} +11/06/2021 21:55:13 - INFO - __main__ - Step 4718: {'lr': 0.000499584333313091, 'samples': 905856, 'steps': 4717, 'loss/train': 1.7350718975067139}}} +11/06/2021 21:55:16 - INFO - __main__ - Step 4723: {'lr': 0.0004995828024577346, 'samples': 906816, 'steps': 4722, 'loss/train': 2.221000909805298}}} +11/06/2021 21:55:18 - INFO - __main__ - Step 4727: {'lr': 0.0004995815757492019, 'samples': 907584, 'steps': 4726, 'loss/train': 1.697227954864502}}} +11/06/2021 21:55:20 - INFO - __main__ - Step 4731: {'lr': 0.0004995803472413474, 'samples': 908352, 'steps': 4730, 'loss/train': 2.062716245651245}}} +11/06/2021 21:55:22 - INFO - __main__ - Step 4735: {'lr': 0.0004995791169341801, 'samples': 909120, 'steps': 4734, 'loss/train': 1.6100257635116577}} +11/06/2021 21:55:24 - INFO - __main__ - Step 4739: {'lr': 0.0004995778848277088, 'samples': 909888, 'steps': 4738, 'loss/train': 1.9893282651901245}} +11/06/2021 21:55:26 - INFO - __main__ - Step 4744: {'lr': 0.0004995763421643621, 'samples': 910848, 'steps': 4743, 'loss/train': 2.054396152496338}}} +11/06/2021 21:55:29 - INFO - __main__ - Step 4749: {'lr': 0.000499574796689634, 'samples': 911808, 'steps': 4748, 'loss/train': 1.5545167922973633}}} +11/06/2021 21:55:29 - INFO - __main__ - Step 4749: {'lr': 0.000499574796689634, 'samples': 911808, 'steps': 4748, 'loss/train': 1.5545167922973633}}} +11/06/2021 21:55:32 - INFO - __main__ - Step 4756: {'lr': 0.0004995726283019275, 'samples': 913152, 'steps': 4755, 'loss/train': 5.469394207000732}}} +11/06/2021 21:55:34 - INFO - __main__ - Step 4760: {'lr': 0.0004995713867492564, 'samples': 913920, 'steps': 4759, 'loss/train': 2.178823471069336}}} +11/06/2021 21:55:37 - INFO - __main__ - Step 4765: {'lr': 0.0004995698322782257, 'samples': 914880, 'steps': 4764, 'loss/train': 1.983769416809082}}} +11/06/2021 21:55:39 - INFO - __main__ - Step 4769: {'lr': 0.0004995685866772586, 'samples': 915648, 'steps': 4768, 'loss/train': 1.642903447151184}}} +11/06/2021 21:55:39 - INFO - __main__ - Step 4769: {'lr': 0.0004995685866772586, 'samples': 915648, 'steps': 4768, 'loss/train': 1.642903447151184}}} +11/06/2021 21:55:42 - INFO - __main__ - Step 4776: {'lr': 0.000499566402546179, 'samples': 916992, 'steps': 4775, 'loss/train': 1.7766259908676147}}} +11/06/2021 21:55:44 - INFO - __main__ - Step 4781: {'lr': 0.0004995648390790249, 'samples': 917952, 'steps': 4780, 'loss/train': 1.954245686531067}}} +11/06/2021 21:55:46 - INFO - __main__ - Step 4785: {'lr': 0.0004995635862811994, 'samples': 918720, 'steps': 4784, 'loss/train': 2.129288911819458}}} +11/06/2021 21:55:46 - INFO - __main__ - Step 4785: {'lr': 0.0004995635862811994, 'samples': 918720, 'steps': 4784, 'loss/train': 2.129288911819458}}} +11/06/2021 21:55:50 - INFO - __main__ - Step 4792: {'lr': 0.0004995613895557048, 'samples': 920064, 'steps': 4791, 'loss/train': 1.883157730102539}}} +11/06/2021 21:55:52 - INFO - __main__ - Step 4796: {'lr': 0.0004995601318101231, 'samples': 920832, 'steps': 4795, 'loss/train': 2.0214784145355225}} +11/06/2021 21:55:54 - INFO - __main__ - Step 4801: {'lr': 0.0004995585570980684, 'samples': 921792, 'steps': 4800, 'loss/train': 2.3950815200805664}} +11/06/2021 21:55:54 - INFO - __main__ - Step 4801: {'lr': 0.0004995585570980684, 'samples': 921792, 'steps': 4800, 'loss/train': 2.3950815200805664}} +11/06/2021 21:55:59 - INFO - __main__ - Step 4809: {'lr': 0.000499556031711532, 'samples': 923328, 'steps': 4808, 'loss/train': 2.4952619075775146}}} +11/06/2021 21:56:00 - INFO - __main__ - Step 4813: {'lr': 0.000499554766319553, 'samples': 924096, 'steps': 4812, 'loss/train': 1.8378645181655884}}} +11/06/2021 21:56:02 - INFO - __main__ - Step 4817: {'lr': 0.0004995534991284455, 'samples': 924864, 'steps': 4816, 'loss/train': 1.8735243082046509}} +11/06/2021 21:56:05 - INFO - __main__ - Step 4822: {'lr': 0.0004995519126095506, 'samples': 925824, 'steps': 4821, 'loss/train': 2.3707022666931152}} +11/06/2021 21:56:05 - INFO - __main__ - Step 4822: {'lr': 0.0004995519126095506, 'samples': 925824, 'steps': 4821, 'loss/train': 2.3707022666931152}} +11/06/2021 21:56:09 - INFO - __main__ - Step 4830: {'lr': 0.0004995493683322259, 'samples': 927360, 'steps': 4829, 'loss/train': 1.904067873954773}}} +11/06/2021 21:56:10 - INFO - __main__ - Step 4834: {'lr': 0.0004995480934949247, 'samples': 928128, 'steps': 4833, 'loss/train': 1.7859026193618774}} +11/06/2021 21:56:12 - INFO - __main__ - Step 4838: {'lr': 0.0004995468168585431, 'samples': 928896, 'steps': 4837, 'loss/train': 1.3020102977752686}} +11/06/2021 21:56:15 - INFO - __main__ - Step 4843: {'lr': 0.0004995452185331235, 'samples': 929856, 'steps': 4842, 'loss/train': 0.33405929803848267} +11/06/2021 21:56:17 - INFO - __main__ - Step 4847: {'lr': 0.0004995439378488449, 'samples': 930624, 'steps': 4846, 'loss/train': 1.7952702045440674}} +11/06/2021 21:56:19 - INFO - __main__ - Step 4851: {'lr': 0.0004995426553655159, 'samples': 931392, 'steps': 4850, 'loss/train': 1.6499428749084473}} +11/06/2021 21:56:20 - INFO - __main__ - Step 4855: {'lr': 0.0004995413710831458, 'samples': 932160, 'steps': 4854, 'loss/train': 2.0572216510772705}} +11/06/2021 21:56:22 - INFO - __main__ - Step 4859: {'lr': 0.0004995400850017438, 'samples': 932928, 'steps': 4858, 'loss/train': 1.930557131767273}}} +11/06/2021 21:56:25 - INFO - __main__ - Step 4864: {'lr': 0.000499538474870117, 'samples': 933888, 'steps': 4863, 'loss/train': 1.7647819519042969}}} +11/06/2021 21:56:27 - INFO - __main__ - Step 4868: {'lr': 0.0004995371847409273, 'samples': 934656, 'steps': 4867, 'loss/train': 0.9957026243209839}} +11/06/2021 21:56:29 - INFO - __main__ - Step 4872: {'lr': 0.0004995358928127359, 'samples': 935424, 'steps': 4871, 'loss/train': 1.3676517009735107}} +11/06/2021 21:56:30 - INFO - __main__ - Step 4876: {'lr': 0.0004995345990855522, 'samples': 936192, 'steps': 4875, 'loss/train': 2.013723850250244}}} +11/06/2021 21:56:32 - INFO - __main__ - Step 4880: {'lr': 0.0004995333035593853, 'samples': 936960, 'steps': 4879, 'loss/train': 1.7942310571670532}} +11/06/2021 21:56:35 - INFO - __main__ - Step 4885: {'lr': 0.0004995316816218712, 'samples': 937920, 'steps': 4884, 'loss/train': 2.102433681488037}}} +11/06/2021 21:56:37 - INFO - __main__ - Step 4890: {'lr': 0.000499530056873479, 'samples': 938880, 'steps': 4889, 'loss/train': 2.1150357723236084}}} +11/06/2021 21:56:37 - INFO - __main__ - Step 4890: {'lr': 0.000499530056873479, 'samples': 938880, 'steps': 4889, 'loss/train': 2.1150357723236084}}} +11/06/2021 21:56:41 - INFO - __main__ - Step 4897: {'lr': 0.0004995277775034894, 'samples': 940224, 'steps': 4896, 'loss/train': 1.8550939559936523}} +11/06/2021 21:56:42 - INFO - __main__ - Step 4901: {'lr': 0.0004995264725328151, 'samples': 940992, 'steps': 4900, 'loss/train': 1.1252635717391968}} +11/06/2021 21:56:44 - INFO - __main__ - Step 4905: {'lr': 0.0004995251657632165, 'samples': 941760, 'steps': 4904, 'loss/train': 1.6950825452804565}} +11/06/2021 21:56:47 - INFO - __main__ - Step 4910: {'lr': 0.0004995235297714951, 'samples': 942720, 'steps': 4909, 'loss/train': 1.769343614578247}}} +11/06/2021 21:56:49 - INFO - __main__ - Step 4914: {'lr': 0.0004995222189543509, 'samples': 943488, 'steps': 4913, 'loss/train': 6.304197311401367}}} +11/06/2021 21:56:51 - INFO - __main__ - Step 4918: {'lr': 0.0004995209063383129, 'samples': 944256, 'steps': 4917, 'loss/train': 1.607182264328003}}} +11/06/2021 21:56:53 - INFO - __main__ - Step 4922: {'lr': 0.0004995195919233906, 'samples': 945024, 'steps': 4921, 'loss/train': 2.1027209758758545}} +11/06/2021 21:56:55 - INFO - __main__ - Step 4926: {'lr': 0.0004995182757095935, 'samples': 945792, 'steps': 4925, 'loss/train': 2.3778295516967773}} +11/06/2021 21:56:55 - INFO - __main__ - Step 4926: {'lr': 0.0004995182757095935, 'samples': 945792, 'steps': 4925, 'loss/train': 2.3778295516967773}} +11/06/2021 21:56:58 - INFO - __main__ - Step 4933: {'lr': 0.0004995159680069346, 'samples': 947136, 'steps': 4932, 'loss/train': 1.8914155960083008}} +11/06/2021 21:57:01 - INFO - __main__ - Step 4937: {'lr': 0.0004995146468462806, 'samples': 947904, 'steps': 4936, 'loss/train': 1.576684832572937}}} +11/06/2021 21:57:03 - INFO - __main__ - Step 4942: {'lr': 0.0004995129928658466, 'samples': 948864, 'steps': 4941, 'loss/train': 1.9636731147766113}} +11/06/2021 21:57:03 - INFO - __main__ - Step 4942: {'lr': 0.0004995129928658466, 'samples': 948864, 'steps': 4941, 'loss/train': 1.9636731147766113}} +11/06/2021 21:57:07 - INFO - __main__ - Step 4950: {'lr': 0.0004995103406509713, 'samples': 950400, 'steps': 4949, 'loss/train': 1.9087032079696655}} +11/06/2021 21:57:09 - INFO - __main__ - Step 4954: {'lr': 0.0004995090118453167, 'samples': 951168, 'steps': 4953, 'loss/train': 1.9926605224609375}} +11/06/2021 21:57:11 - INFO - __main__ - Step 4958: {'lr': 0.0004995076812408636, 'samples': 951936, 'steps': 4957, 'loss/train': 1.9032562971115112}} +11/06/2021 21:57:13 - INFO - __main__ - Step 4963: {'lr': 0.0004995060154557513, 'samples': 952896, 'steps': 4962, 'loss/train': 2.1550307273864746}} +11/06/2021 21:57:13 - INFO - __main__ - Step 4963: {'lr': 0.0004995060154557513, 'samples': 952896, 'steps': 4962, 'loss/train': 2.1550307273864746}} +11/06/2021 21:57:17 - INFO - __main__ - Step 4971: {'lr': 0.0004995033443535541, 'samples': 954432, 'steps': 4970, 'loss/train': 1.7052550315856934}} +11/06/2021 21:57:17 - INFO - __main__ - Step 4971: {'lr': 0.0004995033443535541, 'samples': 954432, 'steps': 4970, 'loss/train': 1.7052550315856934}} +11/06/2021 21:57:21 - INFO - __main__ - Step 4979: {'lr': 0.0004995006660563262, 'samples': 955968, 'steps': 4978, 'loss/train': 2.2604053020477295}} +11/06/2021 21:57:23 - INFO - __main__ - Step 4984: {'lr': 0.0004994989884668665, 'samples': 956928, 'steps': 4983, 'loss/train': 1.7262250185012817}} +11/06/2021 21:57:23 - INFO - __main__ - Step 4984: {'lr': 0.0004994989884668665, 'samples': 956928, 'steps': 4983, 'loss/train': 1.7262250185012817}} +11/06/2021 21:57:27 - INFO - __main__ - Step 4992: {'lr': 0.0004994962984778784, 'samples': 958464, 'steps': 4991, 'loss/train': 0.9767778515815735}} +11/06/2021 21:57:29 - INFO - __main__ - Step 4996: {'lr': 0.000499494950785319, 'samples': 959232, 'steps': 4995, 'loss/train': 0.9503514766693115}}} +11/06/2021 21:57:31 - INFO - __main__ - Step 5000: {'lr': 0.0004994936012940626, 'samples': 960000, 'steps': 4999, 'loss/train': 2.0416653156280518}} +11/06/2021 21:57:33 - INFO - __main__ - Step 5004: {'lr': 0.0004994922500041186, 'samples': 960768, 'steps': 5003, 'loss/train': 1.5910391807556152}} +11/06/2021 21:57:33 - INFO - __main__ - Step 5004: {'lr': 0.0004994922500041186, 'samples': 960768, 'steps': 5003, 'loss/train': 1.5910391807556152}} +11/06/2021 21:57:37 - INFO - __main__ - Step 5012: {'lr': 0.0004994895420282072, 'samples': 962304, 'steps': 5011, 'loss/train': 2.228909969329834}}} +11/06/2021 21:57:39 - INFO - __main__ - Step 5016: {'lr': 0.0004994881853422594, 'samples': 963072, 'steps': 5015, 'loss/train': 1.8377931118011475}} +11/06/2021 21:57:41 - INFO - __main__ - Step 5020: {'lr': 0.000499486826857663, 'samples': 963840, 'steps': 5019, 'loss/train': 1.8107075691223145}}} +11/06/2021 21:57:43 - INFO - __main__ - Step 5025: {'lr': 0.0004994851262225832, 'samples': 964800, 'steps': 5024, 'loss/train': 1.3919230699539185}} +11/06/2021 21:57:45 - INFO - __main__ - Step 5029: {'lr': 0.0004994837636910638, 'samples': 965568, 'steps': 5028, 'loss/train': 1.7136719226837158}} +11/06/2021 21:57:47 - INFO - __main__ - Step 5033: {'lr': 0.0004994823993609279, 'samples': 966336, 'steps': 5032, 'loss/train': 0.8590723872184753}} +11/06/2021 21:57:47 - INFO - __main__ - Step 5033: {'lr': 0.0004994823993609279, 'samples': 966336, 'steps': 5032, 'loss/train': 0.8590723872184753}} +11/06/2021 21:57:51 - INFO - __main__ - Step 5040: {'lr': 0.0004994800074552985, 'samples': 967680, 'steps': 5039, 'loss/train': 1.7678231000900269}} +11/06/2021 21:57:53 - INFO - __main__ - Step 5046: {'lr': 0.0004994779528664095, 'samples': 968832, 'steps': 5045, 'loss/train': 2.0043511390686035}} +11/06/2021 21:57:55 - INFO - __main__ - Step 5050: {'lr': 0.000499476580892263, 'samples': 969600, 'steps': 5049, 'loss/train': 1.4724314212799072}}} +11/06/2021 21:57:58 - INFO - __main__ - Step 5054: {'lr': 0.000499475207119552, 'samples': 970368, 'steps': 5053, 'loss/train': 2.118231773376465}}}} +11/06/2021 21:58:00 - INFO - __main__ - Step 5058: {'lr': 0.0004994738315482859, 'samples': 971136, 'steps': 5057, 'loss/train': 1.5080969333648682}} +11/06/2021 21:58:01 - INFO - __main__ - Step 5062: {'lr': 0.0004994724541784749, 'samples': 971904, 'steps': 5061, 'loss/train': 2.3541839122772217}} +11/06/2021 21:58:03 - INFO - __main__ - Step 5066: {'lr': 0.000499471075010129, 'samples': 972672, 'steps': 5065, 'loss/train': 6.243468761444092}7}} +11/06/2021 21:58:03 - INFO - __main__ - Step 5066: {'lr': 0.000499471075010129, 'samples': 972672, 'steps': 5065, 'loss/train': 6.243468761444092}7}} +11/06/2021 21:58:08 - INFO - __main__ - Step 5074: {'lr': 0.0004994683112778718, 'samples': 974208, 'steps': 5073, 'loss/train': 1.9211030006408691}} +11/06/2021 21:58:09 - INFO - __main__ - Step 5078: {'lr': 0.0004994669267139806, 'samples': 974976, 'steps': 5077, 'loss/train': 2.0437135696411133}} +11/06/2021 21:58:11 - INFO - __main__ - Step 5082: {'lr': 0.0004994655403515941, 'samples': 975744, 'steps': 5081, 'loss/train': 1.8559695482254028}} +11/06/2021 21:58:11 - INFO - __main__ - Step 5082: {'lr': 0.0004994655403515941, 'samples': 975744, 'steps': 5081, 'loss/train': 1.8559695482254028}} +11/06/2021 21:58:15 - INFO - __main__ - Step 5090: {'lr': 0.0004994627622313757, 'samples': 977280, 'steps': 5089, 'loss/train': 1.8420456647872925}} +11/06/2021 21:58:17 - INFO - __main__ - Step 5094: {'lr': 0.0004994613704735638, 'samples': 978048, 'steps': 5093, 'loss/train': 2.3359320163726807}} +11/06/2021 21:58:19 - INFO - __main__ - Step 5098: {'lr': 0.0004994599769172967, 'samples': 978816, 'steps': 5097, 'loss/train': 2.2054691314697266}} +11/06/2021 21:58:21 - INFO - __main__ - Step 5103: {'lr': 0.0004994582324429008, 'samples': 979776, 'steps': 5102, 'loss/train': 1.894245982170105}}} +11/06/2021 21:58:21 - INFO - __main__ - Step 5103: {'lr': 0.0004994582324429008, 'samples': 979776, 'steps': 5102, 'loss/train': 1.894245982170105}}} +11/06/2021 21:58:21 - INFO - __main__ - Step 5103: {'lr': 0.0004994582324429008, 'samples': 979776, 'steps': 5102, 'loss/train': 1.894245982170105}}} +11/06/2021 21:58:27 - INFO - __main__ - Step 5114: {'lr': 0.0004994543847078787, 'samples': 981888, 'steps': 5113, 'loss/train': 1.3129998445510864}} +11/06/2021 21:58:29 - INFO - __main__ - Step 5119: {'lr': 0.0004994526312413897, 'samples': 982848, 'steps': 5118, 'loss/train': 1.6690380573272705}} +11/06/2021 21:58:32 - INFO - __main__ - Step 5124: {'lr': 0.000499450874964913, 'samples': 983808, 'steps': 5123, 'loss/train': 2.1291959285736084}}} +11/06/2021 21:58:34 - INFO - __main__ - Step 5128: {'lr': 0.0004994494679205539, 'samples': 984576, 'steps': 5127, 'loss/train': 2.0760858058929443}} +11/06/2021 21:58:34 - INFO - __main__ - Step 5128: {'lr': 0.0004994494679205539, 'samples': 984576, 'steps': 5127, 'loss/train': 2.0760858058929443}} +11/06/2021 21:58:37 - INFO - __main__ - Step 5135: {'lr': 0.0004994470012656052, 'samples': 985920, 'steps': 5134, 'loss/train': 2.2697160243988037}} +11/06/2021 21:58:39 - INFO - __main__ - Step 5140: {'lr': 0.0004994452359973012, 'samples': 986880, 'steps': 5139, 'loss/train': 1.6053614616394043}} +11/06/2021 21:58:39 - INFO - __main__ - Step 5140: {'lr': 0.0004994452359973012, 'samples': 986880, 'steps': 5139, 'loss/train': 1.6053614616394043}} +11/06/2021 21:58:39 - INFO - __main__ - Step 5140: {'lr': 0.0004994452359973012, 'samples': 986880, 'steps': 5139, 'loss/train': 1.6053614616394043}} +11/06/2021 21:58:45 - INFO - __main__ - Step 5151: {'lr': 0.0004994413425161969, 'samples': 988992, 'steps': 5150, 'loss/train': 1.2515465021133423}} +11/06/2021 21:58:47 - INFO - __main__ - Step 5155: {'lr': 0.0004994399233330426, 'samples': 989760, 'steps': 5154, 'loss/train': 2.2096810340881348}} +11/06/2021 21:58:47 - INFO - __main__ - Step 5155: {'lr': 0.0004994399233330426, 'samples': 989760, 'steps': 5154, 'loss/train': 2.2096810340881348}} +11/06/2021 21:58:51 - INFO - __main__ - Step 5163: {'lr': 0.0004994370795718425, 'samples': 991296, 'steps': 5162, 'loss/train': 2.0610859394073486}} +11/06/2021 21:58:53 - INFO - __main__ - Step 5168: {'lr': 0.000499435298568331, 'samples': 992256, 'steps': 5167, 'loss/train': 2.4085593223571777}}} +11/06/2021 21:58:53 - INFO - __main__ - Step 5168: {'lr': 0.000499435298568331, 'samples': 992256, 'steps': 5167, 'loss/train': 2.4085593223571777}}} +11/06/2021 21:58:58 - INFO - __main__ - Step 5176: {'lr': 0.000499432443118353, 'samples': 993792, 'steps': 5175, 'loss/train': 2.3936564922332764}}} +11/06/2021 21:59:00 - INFO - __main__ - Step 5180: {'lr': 0.0004994310126959887, 'samples': 994560, 'steps': 5179, 'loss/train': 1.998255968093872}}} +11/06/2021 21:59:01 - INFO - __main__ - Step 5184: {'lr': 0.0004994295804753885, 'samples': 995328, 'steps': 5183, 'loss/train': 1.9894294738769531}} +11/06/2021 21:59:03 - INFO - __main__ - Step 5188: {'lr': 0.0004994281464565623, 'samples': 996096, 'steps': 5187, 'loss/train': 1.9112964868545532}} +11/06/2021 21:59:03 - INFO - __main__ - Step 5188: {'lr': 0.0004994281464565623, 'samples': 996096, 'steps': 5187, 'loss/train': 1.9112964868545532}} +11/06/2021 21:59:08 - INFO - __main__ - Step 5196: {'lr': 0.0004994252730242734, 'samples': 997632, 'steps': 5195, 'loss/train': 2.2125959396362305}} +11/06/2021 21:59:10 - INFO - __main__ - Step 5200: {'lr': 0.0004994238336108315, 'samples': 998400, 'steps': 5199, 'loss/train': 1.941856861114502}}} +11/06/2021 21:59:11 - INFO - __main__ - Step 5204: {'lr': 0.0004994223923992052, 'samples': 999168, 'steps': 5203, 'loss/train': 1.8816064596176147}} +11/06/2021 21:59:14 - INFO - __main__ - Step 5209: {'lr': 0.000499420588355991, 'samples': 1000128, 'steps': 5208, 'loss/train': 2.1907718181610107}} +11/06/2021 21:59:16 - INFO - __main__ - Step 5213: {'lr': 0.0004994191430984876, 'samples': 1000896, 'steps': 5212, 'loss/train': 1.5323981046676636} +11/06/2021 21:59:18 - INFO - __main__ - Step 5217: {'lr': 0.0004994176960428333, 'samples': 1001664, 'steps': 5216, 'loss/train': 2.4069254398345947} +11/06/2021 21:59:18 - INFO - __main__ - Step 5217: {'lr': 0.0004994176960428333, 'samples': 1001664, 'steps': 5216, 'loss/train': 2.4069254398345947} +11/06/2021 21:59:21 - INFO - __main__ - Step 5224: {'lr': 0.0004994151593686699, 'samples': 1003008, 'steps': 5223, 'loss/train': 0.5793285965919495} +11/06/2021 21:59:24 - INFO - __main__ - Step 5229: {'lr': 0.0004994133440870712, 'samples': 1003968, 'steps': 5228, 'loss/train': 2.3762245178222656} +11/06/2021 21:59:24 - INFO - __main__ - Step 5229: {'lr': 0.0004994133440870712, 'samples': 1003968, 'steps': 5228, 'loss/train': 2.3762245178222656} +11/06/2021 21:59:28 - INFO - __main__ - Step 5236: {'lr': 0.0004994107979728019, 'samples': 1005312, 'steps': 5235, 'loss/train': 1.0656429529190063} +11/06/2021 21:59:29 - INFO - __main__ - Step 5240: {'lr': 0.0004994093405779842, 'samples': 1006080, 'steps': 5239, 'loss/train': 1.9837573766708374} +11/06/2021 21:59:32 - INFO - __main__ - Step 5245: {'lr': 0.0004994075163059134, 'samples': 1007040, 'steps': 5244, 'loss/train': 1.456217646598816}} +11/06/2021 21:59:32 - INFO - __main__ - Step 5245: {'lr': 0.0004994075163059134, 'samples': 1007040, 'steps': 5244, 'loss/train': 1.456217646598816}} +11/06/2021 21:59:36 - INFO - __main__ - Step 5253: {'lr': 0.0004994045916268913, 'samples': 1008576, 'steps': 5252, 'loss/train': 1.8525824546813965} +11/06/2021 21:59:38 - INFO - __main__ - Step 5257: {'lr': 0.0004994031265903063, 'samples': 1009344, 'steps': 5256, 'loss/train': 2.477855920791626}} +11/06/2021 21:59:39 - INFO - __main__ - Step 5261: {'lr': 0.0004994016597556862, 'samples': 1010112, 'steps': 5260, 'loss/train': 2.4520223140716553} +11/06/2021 21:59:42 - INFO - __main__ - Step 5266: {'lr': 0.00049939982368394, 'samples': 1011072, 'steps': 5265, 'loss/train': 1.825718879699707}53} +11/06/2021 21:59:42 - INFO - __main__ - Step 5266: {'lr': 0.00049939982368394, 'samples': 1011072, 'steps': 5265, 'loss/train': 1.825718879699707}53} +11/06/2021 21:59:42 - INFO - __main__ - Step 5266: {'lr': 0.00049939982368394, 'samples': 1011072, 'steps': 5265, 'loss/train': 1.825718879699707}53} +11/06/2021 21:59:47 - INFO - __main__ - Step 5276: {'lr': 0.0004993961431122901, 'samples': 1012992, 'steps': 5275, 'loss/train': 2.171734094619751}} +11/06/2021 21:59:50 - INFO - __main__ - Step 5281: {'lr': 0.0004993942986124278, 'samples': 1013952, 'steps': 5280, 'loss/train': 1.8966882228851318} +11/06/2021 21:59:52 - INFO - __main__ - Step 5286: {'lr': 0.0004993924513032349, 'samples': 1014912, 'steps': 5285, 'loss/train': 2.124772071838379}} +11/06/2021 21:59:54 - INFO - __main__ - Step 5290: {'lr': 0.0004993909714331766, 'samples': 1015680, 'steps': 5289, 'loss/train': 2.3629143238067627} +11/06/2021 21:59:54 - INFO - __main__ - Step 5290: {'lr': 0.0004993909714331766, 'samples': 1015680, 'steps': 5289, 'loss/train': 2.3629143238067627} +11/06/2021 21:59:57 - INFO - __main__ - Step 5297: {'lr': 0.0004993883773342695, 'samples': 1017024, 'steps': 5296, 'loss/train': 1.9744642972946167} +11/06/2021 22:00:00 - INFO - __main__ - Step 5303: {'lr': 0.0004993861494384669, 'samples': 1018176, 'steps': 5302, 'loss/train': 1.8540432453155518} +11/06/2021 22:00:02 - INFO - __main__ - Step 5307: {'lr': 0.0004993846619272052, 'samples': 1018944, 'steps': 5306, 'loss/train': 2.057713508605957}} +11/06/2021 22:00:04 - INFO - __main__ - Step 5311: {'lr': 0.0004993831726180414, 'samples': 1019712, 'steps': 5310, 'loss/train': 0.6815013289451599} +11/06/2021 22:00:04 - INFO - __main__ - Step 5311: {'lr': 0.0004993831726180414, 'samples': 1019712, 'steps': 5310, 'loss/train': 0.6815013289451599} +11/06/2021 22:00:08 - INFO - __main__ - Step 5318: {'lr': 0.0004993805620008353, 'samples': 1021056, 'steps': 5317, 'loss/train': 2.118875026702881}} +11/06/2021 22:00:10 - INFO - __main__ - Step 5323: {'lr': 0.0004993786939032451, 'samples': 1022016, 'steps': 5322, 'loss/train': 1.7816057205200195} +11/06/2021 22:00:10 - INFO - __main__ - Step 5323: {'lr': 0.0004993786939032451, 'samples': 1022016, 'steps': 5322, 'loss/train': 1.7816057205200195} +11/06/2021 22:00:14 - INFO - __main__ - Step 5331: {'lr': 0.0004993756991040675, 'samples': 1023552, 'steps': 5330, 'loss/train': 1.8130137920379639} +11/06/2021 22:00:16 - INFO - __main__ - Step 5335: {'lr': 0.0004993741990077172, 'samples': 1024320, 'steps': 5334, 'loss/train': 2.3342111110687256} +11/06/2021 22:00:18 - INFO - __main__ - Step 5340: {'lr': 0.0004993723213590868, 'samples': 1025280, 'steps': 5339, 'loss/train': 2.2036027908325195} +11/06/2021 22:00:20 - INFO - __main__ - Step 5344: {'lr': 0.0004993708172176417, 'samples': 1026048, 'steps': 5343, 'loss/train': 1.9710315465927124} +11/06/2021 22:00:22 - INFO - __main__ - Step 5349: {'lr': 0.0004993689345126771, 'samples': 1027008, 'steps': 5348, 'loss/train': 2.151108503341675}} +11/06/2021 22:00:24 - INFO - __main__ - Step 5353: {'lr': 0.0004993674263261921, 'samples': 1027776, 'steps': 5352, 'loss/train': 1.639163851737976}} +11/06/2021 22:00:26 - INFO - __main__ - Step 5357: {'lr': 0.0004993659163419294, 'samples': 1028544, 'steps': 5356, 'loss/train': 2.263580322265625}} +11/06/2021 22:00:28 - INFO - __main__ - Step 5361: {'lr': 0.0004993644045598997, 'samples': 1029312, 'steps': 5360, 'loss/train': 2.4149515628814697} +11/06/2021 22:00:30 - INFO - __main__ - Step 5365: {'lr': 0.0004993628909801138, 'samples': 1030080, 'steps': 5364, 'loss/train': 1.8695933818817139} +11/06/2021 22:00:32 - INFO - __main__ - Step 5369: {'lr': 0.000499361375602583, 'samples': 1030848, 'steps': 5368, 'loss/train': 2.0226683616638184}} +11/06/2021 22:00:34 - INFO - __main__ - Step 5374: {'lr': 0.0004993594788526069, 'samples': 1031808, 'steps': 5373, 'loss/train': 2.1130635738372803} +11/06/2021 22:00:37 - INFO - __main__ - Step 5378: {'lr': 0.0004993579594301895, 'samples': 1032576, 'steps': 5377, 'loss/train': 1.8319172859191895} +11/06/2021 22:00:39 - INFO - __main__ - Step 5382: {'lr': 0.0004993564382100624, 'samples': 1033344, 'steps': 5381, 'loss/train': 1.3644241094589233} +11/06/2021 22:00:40 - INFO - __main__ - Step 5386: {'lr': 0.0004993549151922367, 'samples': 1034112, 'steps': 5385, 'loss/train': 2.5312018394470215} +11/06/2021 22:00:42 - INFO - __main__ - Step 5390: {'lr': 0.0004993533903767235, 'samples': 1034880, 'steps': 5389, 'loss/train': 1.5707823038101196} +11/06/2021 22:00:42 - INFO - __main__ - Step 5390: {'lr': 0.0004993533903767235, 'samples': 1034880, 'steps': 5389, 'loss/train': 1.5707823038101196} +11/06/2021 22:00:46 - INFO - __main__ - Step 5398: {'lr': 0.0004993503353526779, 'samples': 1036416, 'steps': 5397, 'loss/train': 1.566808819770813}} +11/06/2021 22:00:48 - INFO - __main__ - Step 5402: {'lr': 0.0004993488051441677, 'samples': 1037184, 'steps': 5401, 'loss/train': 1.2702760696411133} +11/06/2021 22:00:50 - INFO - __main__ - Step 5406: {'lr': 0.000499347273138014, 'samples': 1037952, 'steps': 5405, 'loss/train': 1.485642433166504}3} +11/06/2021 22:00:52 - INFO - __main__ - Step 5411: {'lr': 0.0004993453556024023, 'samples': 1038912, 'steps': 5410, 'loss/train': 1.6171423196792603} +11/06/2021 22:00:55 - INFO - __main__ - Step 5416: {'lr': 0.0004993434352580115, 'samples': 1039872, 'steps': 5415, 'loss/train': 1.5889499187469482} +11/06/2021 22:00:55 - INFO - __main__ - Step 5416: {'lr': 0.0004993434352580115, 'samples': 1039872, 'steps': 5415, 'loss/train': 1.5889499187469482} +11/06/2021 22:00:58 - INFO - __main__ - Step 5422: {'lr': 0.0004993411271371842, 'samples': 1041024, 'steps': 5421, 'loss/train': 1.9106769561767578} +11/06/2021 22:00:58 - INFO - __main__ - Step 5422: {'lr': 0.0004993411271371842, 'samples': 1041024, 'steps': 5421, 'loss/train': 1.9106769561767578} +11/06/2021 22:00:58 - INFO - __main__ - Step 5422: {'lr': 0.0004993411271371842, 'samples': 1041024, 'steps': 5421, 'loss/train': 1.9106769561767578} +11/06/2021 22:01:04 - INFO - __main__ - Step 5433: {'lr': 0.0004993368850777052, 'samples': 1043136, 'steps': 5432, 'loss/train': 2.2101669311523438} +11/06/2021 22:01:06 - INFO - __main__ - Step 5438: {'lr': 0.0004993349523749431, 'samples': 1044096, 'steps': 5437, 'loss/train': 1.8289518356323242} +11/06/2021 22:01:08 - INFO - __main__ - Step 5442: {'lr': 0.0004993334041904957, 'samples': 1044864, 'steps': 5441, 'loss/train': 0.3798553943634033} +11/06/2021 22:01:10 - INFO - __main__ - Step 5446: {'lr': 0.0004993318542085157, 'samples': 1045632, 'steps': 5445, 'loss/train': 2.161842107772827}} +11/06/2021 22:01:12 - INFO - __main__ - Step 5450: {'lr': 0.0004993303024290143, 'samples': 1046400, 'steps': 5449, 'loss/train': 2.0517914295196533} +11/06/2021 22:01:14 - INFO - __main__ - Step 5455: {'lr': 0.0004993283601768902, 'samples': 1047360, 'steps': 5454, 'loss/train': 2.6343281269073486} +11/06/2021 22:01:16 - INFO - __main__ - Step 5459: {'lr': 0.0004993268043530067, 'samples': 1048128, 'steps': 5458, 'loss/train': 1.2634351253509521} +11/06/2021 22:01:16 - INFO - __main__ - Step 5459: {'lr': 0.0004993268043530067, 'samples': 1048128, 'steps': 5458, 'loss/train': 1.2634351253509521} +11/06/2021 22:01:20 - INFO - __main__ - Step 5467: {'lr': 0.000499323687312796, 'samples': 1049664, 'steps': 5466, 'loss/train': 1.905300498008728}1} +11/06/2021 22:01:22 - INFO - __main__ - Step 5471: {'lr': 0.0004993221260964912, 'samples': 1050432, 'steps': 5470, 'loss/train': 2.155994415283203}} +11/06/2021 22:01:24 - INFO - __main__ - Step 5476: {'lr': 0.0004993201720484458, 'samples': 1051392, 'steps': 5475, 'loss/train': 1.8536326885223389} +11/06/2021 22:01:27 - INFO - __main__ - Step 5481: {'lr': 0.0004993182151919049, 'samples': 1052352, 'steps': 5480, 'loss/train': 2.0209407806396484} +11/06/2021 22:01:29 - INFO - __main__ - Step 5485: {'lr': 0.0004993166476845701, 'samples': 1053120, 'steps': 5484, 'loss/train': 2.2243385314941406} +11/06/2021 22:01:29 - INFO - __main__ - Step 5485: {'lr': 0.0004993166476845701, 'samples': 1053120, 'steps': 5484, 'loss/train': 2.2243385314941406} +11/06/2021 22:01:32 - INFO - __main__ - Step 5492: {'lr': 0.000499313900221719, 'samples': 1054464, 'steps': 5491, 'loss/train': 1.8107589483261108}} +11/06/2021 22:01:34 - INFO - __main__ - Step 5497: {'lr': 0.0004993119343781406, 'samples': 1055424, 'steps': 5496, 'loss/train': 1.697355031967163}} +11/06/2021 22:01:36 - INFO - __main__ - Step 5501: {'lr': 0.0004993103596812267, 'samples': 1056192, 'steps': 5500, 'loss/train': 1.8864690065383911} +11/06/2021 22:01:39 - INFO - __main__ - Step 5506: {'lr': 0.0004993083887825393, 'samples': 1057152, 'steps': 5505, 'loss/train': 2.18703556060791}1} +11/06/2021 22:01:41 - INFO - __main__ - Step 5510: {'lr': 0.0004993068100415671, 'samples': 1057920, 'steps': 5509, 'loss/train': 1.877155065536499}} +11/06/2021 22:01:41 - INFO - __main__ - Step 5510: {'lr': 0.0004993068100415671, 'samples': 1057920, 'steps': 5509, 'loss/train': 1.877155065536499}} +11/06/2021 22:01:44 - INFO - __main__ - Step 5517: {'lr': 0.0004993040429200211, 'samples': 1059264, 'steps': 5516, 'loss/train': 2.012702465057373}} +11/06/2021 22:01:46 - INFO - __main__ - Step 5522: {'lr': 0.0004993020630346509, 'samples': 1060224, 'steps': 5521, 'loss/train': 2.444692611694336}} +11/06/2021 22:01:49 - INFO - __main__ - Step 5527: {'lr': 0.0004993000803409891, 'samples': 1061184, 'steps': 5526, 'loss/train': 2.20894455909729}}} +11/06/2021 22:01:51 - INFO - __main__ - Step 5531: {'lr': 0.0004992984921641048, 'samples': 1061952, 'steps': 5530, 'loss/train': 2.0082509517669678} +11/06/2021 22:01:51 - INFO - __main__ - Step 5531: {'lr': 0.0004992984921641048, 'samples': 1061952, 'steps': 5530, 'loss/train': 2.0082509517669678} +11/06/2021 22:01:54 - INFO - __main__ - Step 5538: {'lr': 0.0004992957085298571, 'samples': 1063296, 'steps': 5537, 'loss/train': 1.3260631561279297} +11/06/2021 22:01:56 - INFO - __main__ - Step 5543: {'lr': 0.0004992937168498126, 'samples': 1064256, 'steps': 5542, 'loss/train': 1.7761310338974}97} +11/06/2021 22:01:59 - INFO - __main__ - Step 5548: {'lr': 0.0004992917223615706, 'samples': 1065216, 'steps': 5547, 'loss/train': 1.4636272192001343} +11/06/2021 22:01:59 - INFO - __main__ - Step 5548: {'lr': 0.0004992917223615706, 'samples': 1065216, 'steps': 5547, 'loss/train': 1.4636272192001343} +11/06/2021 22:02:02 - INFO - __main__ - Step 5554: {'lr': 0.000499289325268891, 'samples': 1066368, 'steps': 5553, 'loss/train': 1.8733552694320679}} +11/06/2021 22:02:04 - INFO - __main__ - Step 5558: {'lr': 0.0004992877249605838, 'samples': 1067136, 'steps': 5557, 'loss/train': 2.2034895420074463} +11/06/2021 22:02:06 - INFO - __main__ - Step 5563: {'lr': 0.0004992857220478841, 'samples': 1068096, 'steps': 5562, 'loss/train': 1.9436842203140259} +11/06/2021 22:02:08 - INFO - __main__ - Step 5567: {'lr': 0.0004992841176958858, 'samples': 1068864, 'steps': 5566, 'loss/train': 1.8892325162887573} +11/06/2021 22:02:08 - INFO - __main__ - Step 5567: {'lr': 0.0004992841176958858, 'samples': 1068864, 'steps': 5566, 'loss/train': 1.8892325162887573} +11/06/2021 22:02:12 - INFO - __main__ - Step 5574: {'lr': 0.000499281305755438, 'samples': 1070208, 'steps': 5573, 'loss/train': 1.4345474243164062}} +11/06/2021 22:02:14 - INFO - __main__ - Step 5578: {'lr': 0.0004992796964612302, 'samples': 1070976, 'steps': 5577, 'loss/train': 2.1370227336883545} +11/06/2021 22:02:16 - INFO - __main__ - Step 5583: {'lr': 0.0004992776823162362, 'samples': 1071936, 'steps': 5582, 'loss/train': 1.6253973245620728} +11/06/2021 22:02:19 - INFO - __main__ - Step 5588: {'lr': 0.0004992756653632252, 'samples': 1072896, 'steps': 5587, 'loss/train': 2.1524899005889893} +11/06/2021 22:02:19 - INFO - __main__ - Step 5588: {'lr': 0.0004992756653632252, 'samples': 1072896, 'steps': 5587, 'loss/train': 2.1524899005889893} +11/06/2021 22:02:22 - INFO - __main__ - Step 5595: {'lr': 0.0004992728369115848, 'samples': 1074240, 'steps': 5594, 'loss/train': 0.8529731631278992} +11/06/2021 22:02:24 - INFO - __main__ - Step 5600: {'lr': 0.0004992708132194259, 'samples': 1075200, 'steps': 5599, 'loss/train': 1.7190282344818115} +11/06/2021 22:02:24 - INFO - __main__ - Step 5600: {'lr': 0.0004992708132194259, 'samples': 1075200, 'steps': 5599, 'loss/train': 1.7190282344818115} +11/06/2021 22:02:28 - INFO - __main__ - Step 5608: {'lr': 0.0004992675694714671, 'samples': 1076736, 'steps': 5607, 'loss/train': 2.1556620597839355} +11/06/2021 22:02:28 - INFO - __main__ - Step 5608: {'lr': 0.0004992675694714671, 'samples': 1076736, 'steps': 5607, 'loss/train': 2.1556620597839355} +11/06/2021 22:02:32 - INFO - __main__ - Step 5616: {'lr': 0.0004992643185352765, 'samples': 1078272, 'steps': 5615, 'loss/train': 2.0697097778320312} +11/06/2021 22:02:32 - INFO - __main__ - Step 5616: {'lr': 0.0004992643185352765, 'samples': 1078272, 'steps': 5615, 'loss/train': 2.0697097778320312} +11/06/2021 22:02:37 - INFO - __main__ - Step 5624: {'lr': 0.0004992610604109481, 'samples': 1079808, 'steps': 5623, 'loss/train': 2.165574312210083}} +11/06/2021 22:02:38 - INFO - __main__ - Step 5628: {'lr': 0.0004992594286532615, 'samples': 1080576, 'steps': 5627, 'loss/train': 1.958828330039978}} +11/06/2021 22:02:40 - INFO - __main__ - Step 5632: {'lr': 0.0004992577950985757, 'samples': 1081344, 'steps': 5631, 'loss/train': 2.0259532928466797} +11/06/2021 22:02:42 - INFO - __main__ - Step 5637: {'lr': 0.0004992557506282061, 'samples': 1082304, 'steps': 5636, 'loss/train': 1.9845712184906006} +11/06/2021 22:02:45 - INFO - __main__ - Step 5641: {'lr': 0.000499254113030315, 'samples': 1083072, 'steps': 5640, 'loss/train': 1.8128447532653809}} +11/06/2021 22:02:47 - INFO - __main__ - Step 5645: {'lr': 0.0004992524736354631, 'samples': 1083840, 'steps': 5644, 'loss/train': 2.096315622329712}} +11/06/2021 22:02:49 - INFO - __main__ - Step 5649: {'lr': 0.000499250832443662, 'samples': 1084608, 'steps': 5648, 'loss/train': 2.2662413120269775}} +11/06/2021 22:02:50 - INFO - __main__ - Step 5653: {'lr': 0.0004992491894549236, 'samples': 1085376, 'steps': 5652, 'loss/train': 1.7326874732971191} +11/06/2021 22:02:52 - INFO - __main__ - Step 5657: {'lr': 0.00049924754466926, 'samples': 1086144, 'steps': 5656, 'loss/train': 2.187472105026245}91} +11/06/2021 22:02:55 - INFO - __main__ - Step 5662: {'lr': 0.000499245486160272, 'samples': 1087104, 'steps': 5661, 'loss/train': 1.9282915592193604}} +11/06/2021 22:02:57 - INFO - __main__ - Step 5666: {'lr': 0.0004992438373315694, 'samples': 1087872, 'steps': 5665, 'loss/train': 1.5366052389144897} +11/06/2021 22:02:59 - INFO - __main__ - Step 5670: {'lr': 0.0004992421867059801, 'samples': 1088640, 'steps': 5669, 'loss/train': 1.8856055736541748} +11/06/2021 22:03:00 - INFO - __main__ - Step 5674: {'lr': 0.0004992405342835158, 'samples': 1089408, 'steps': 5673, 'loss/train': 1.913179636001587}} +11/06/2021 22:03:02 - INFO - __main__ - Step 5678: {'lr': 0.0004992388800641885, 'samples': 1090176, 'steps': 5677, 'loss/train': 2.1851115226745605} +11/06/2021 22:03:05 - INFO - __main__ - Step 5683: {'lr': 0.0004992368097632089, 'samples': 1091136, 'steps': 5682, 'loss/train': 2.1074047088623047} +11/06/2021 22:03:07 - INFO - __main__ - Step 5687: {'lr': 0.0004992351515009833, 'samples': 1091904, 'steps': 5686, 'loss/train': 1.8593014478683472} +11/06/2021 22:03:07 - INFO - __main__ - Step 5687: {'lr': 0.0004992351515009833, 'samples': 1091904, 'steps': 5686, 'loss/train': 1.8593014478683472} +11/06/2021 22:03:10 - INFO - __main__ - Step 5694: {'lr': 0.0004992322452184876, 'samples': 1093248, 'steps': 5693, 'loss/train': 2.2784321308135986} +11/06/2021 22:03:12 - INFO - __main__ - Step 5699: {'lr': 0.0004992301659334095, 'samples': 1094208, 'steps': 5698, 'loss/train': 1.779240369796753}} +11/06/2021 22:03:15 - INFO - __main__ - Step 5704: {'lr': 0.0004992280838408496, 'samples': 1095168, 'steps': 5703, 'loss/train': 2.011932611465454}} +11/06/2021 22:03:17 - INFO - __main__ - Step 5708: {'lr': 0.0004992264161454306, 'samples': 1095936, 'steps': 5707, 'loss/train': 2.132072925567627}} +11/06/2021 22:03:17 - INFO - __main__ - Step 5708: {'lr': 0.0004992264161454306, 'samples': 1095936, 'steps': 5707, 'loss/train': 2.132072925567627}} +11/06/2021 22:03:20 - INFO - __main__ - Step 5715: {'lr': 0.000499223493354998, 'samples': 1097280, 'steps': 5714, 'loss/train': 1.668257713317871}}} +11/06/2021 22:03:23 - INFO - __main__ - Step 5720: {'lr': 0.0004992214022786546, 'samples': 1098240, 'steps': 5719, 'loss/train': 2.1646392345428467} +11/06/2021 22:03:25 - INFO - __main__ - Step 5724: {'lr': 0.000499219727396263, 'samples': 1099008, 'steps': 5723, 'loss/train': 1.9365618228912354}} +11/06/2021 22:03:25 - INFO - __main__ - Step 5724: {'lr': 0.000499219727396263, 'samples': 1099008, 'steps': 5723, 'loss/train': 1.9365618228912354}} +11/06/2021 22:03:28 - INFO - __main__ - Step 5731: {'lr': 0.0004992167920287443, 'samples': 1100352, 'steps': 5730, 'loss/train': 1.7039726972579956} +11/06/2021 22:03:31 - INFO - __main__ - Step 5736: {'lr': 0.0004992146919688584, 'samples': 1101312, 'steps': 5735, 'loss/train': 2.2007718086242676} +11/06/2021 22:03:31 - INFO - __main__ - Step 5736: {'lr': 0.0004992146919688584, 'samples': 1101312, 'steps': 5735, 'loss/train': 2.2007718086242676} +11/06/2021 22:03:35 - INFO - __main__ - Step 5744: {'lr': 0.0004992113260338517, 'samples': 1102848, 'steps': 5743, 'loss/train': 1.731091022491455}} +11/06/2021 22:03:37 - INFO - __main__ - Step 5748: {'lr': 0.0004992096403713635, 'samples': 1103616, 'steps': 5747, 'loss/train': 2.426661491394043}} +11/06/2021 22:03:39 - INFO - __main__ - Step 5752: {'lr': 0.0004992079529122351, 'samples': 1104384, 'steps': 5751, 'loss/train': 2.0824427604675293} +11/06/2021 22:03:41 - INFO - __main__ - Step 5757: {'lr': 0.0004992058410618177, 'samples': 1105344, 'steps': 5756, 'loss/train': 1.8771767616271973} +11/06/2021 22:03:43 - INFO - __main__ - Step 5761: {'lr': 0.0004992041495602931, 'samples': 1106112, 'steps': 5760, 'loss/train': 1.8871279954910278} +11/06/2021 22:03:45 - INFO - __main__ - Step 5765: {'lr': 0.0004992024562621678, 'samples': 1106880, 'steps': 5764, 'loss/train': 2.004040479660034}} +11/06/2021 22:03:47 - INFO - __main__ - Step 5769: {'lr': 0.000499200761167454, 'samples': 1107648, 'steps': 5768, 'loss/train': 1.7773163318634033}} +11/06/2021 22:03:49 - INFO - __main__ - Step 5773: {'lr': 0.000499199064276164, 'samples': 1108416, 'steps': 5772, 'loss/train': 2.8149049282073975}} +11/06/2021 22:03:51 - INFO - __main__ - Step 5777: {'lr': 0.0004991973655883099, 'samples': 1109184, 'steps': 5776, 'loss/train': 1.8211041688919067} +11/06/2021 22:03:53 - INFO - __main__ - Step 5782: {'lr': 0.0004991952397020927, 'samples': 1110144, 'steps': 5781, 'loss/train': 1.9769641160964966} +11/06/2021 22:03:55 - INFO - __main__ - Step 5786: {'lr': 0.0004991935369720143, 'samples': 1110912, 'steps': 5785, 'loss/train': 2.5987279415130615} +11/06/2021 22:03:57 - INFO - __main__ - Step 5790: {'lr': 0.0004991918324454117, 'samples': 1111680, 'steps': 5789, 'loss/train': 1.8697025775909424} +11/06/2021 22:03:59 - INFO - __main__ - Step 5794: {'lr': 0.0004991901261222971, 'samples': 1112448, 'steps': 5793, 'loss/train': 2.1112143993377686} +11/06/2021 22:04:01 - INFO - __main__ - Step 5798: {'lr': 0.000499188418002683, 'samples': 1113216, 'steps': 5797, 'loss/train': 2.0395941734313965}} +11/06/2021 22:04:03 - INFO - __main__ - Step 5803: {'lr': 0.0004991862803268564, 'samples': 1114176, 'steps': 5802, 'loss/train': 2.107743501663208}} +11/06/2021 22:04:03 - INFO - __main__ - Step 5803: {'lr': 0.0004991862803268564, 'samples': 1114176, 'steps': 5802, 'loss/train': 2.107743501663208}} +11/06/2021 22:04:07 - INFO - __main__ - Step 5810: {'lr': 0.0004991832828649661, 'samples': 1115520, 'steps': 5809, 'loss/train': 1.6817560195922852} +11/06/2021 22:04:09 - INFO - __main__ - Step 5814: {'lr': 0.0004991815675594768, 'samples': 1116288, 'steps': 5813, 'loss/train': 1.5646218061447144} +11/06/2021 22:04:11 - INFO - __main__ - Step 5819: {'lr': 0.0004991794209013758, 'samples': 1117248, 'steps': 5818, 'loss/train': 1.8572213649749756} +11/06/2021 22:04:13 - INFO - __main__ - Step 5824: {'lr': 0.0004991772714363649, 'samples': 1118208, 'steps': 5823, 'loss/train': 1.790226936340332}} +11/06/2021 22:04:13 - INFO - __main__ - Step 5824: {'lr': 0.0004991772714363649, 'samples': 1118208, 'steps': 5823, 'loss/train': 1.790226936340332}} +11/06/2021 22:04:17 - INFO - __main__ - Step 5831: {'lr': 0.0004991742574697866, 'samples': 1119552, 'steps': 5830, 'loss/train': 1.9625569581985474} +11/06/2021 22:04:19 - INFO - __main__ - Step 5835: {'lr': 0.0004991725327331366, 'samples': 1120320, 'steps': 5834, 'loss/train': 1.6535284519195557} +11/06/2021 22:04:22 - INFO - __main__ - Step 5840: {'lr': 0.0004991703742861762, 'samples': 1121280, 'steps': 5839, 'loss/train': 2.014793872833252}} +11/06/2021 22:04:24 - INFO - __main__ - Step 5844: {'lr': 0.0004991686455077049, 'samples': 1122048, 'steps': 5843, 'loss/train': 2.0172688961029053} +11/06/2021 22:04:25 - INFO - __main__ - Step 5848: {'lr': 0.0004991669149328889, 'samples': 1122816, 'steps': 5847, 'loss/train': 1.8865562677383423} +11/06/2021 22:04:27 - INFO - __main__ - Step 5852: {'lr': 0.0004991651825617406, 'samples': 1123584, 'steps': 5851, 'loss/train': 2.156768560409546}} +11/06/2021 22:04:29 - INFO - __main__ - Step 5856: {'lr': 0.0004991634483942725, 'samples': 1124352, 'steps': 5855, 'loss/train': 1.9906128644943237} +11/06/2021 22:04:29 - INFO - __main__ - Step 5856: {'lr': 0.0004991634483942725, 'samples': 1124352, 'steps': 5855, 'loss/train': 1.9906128644943237} +11/06/2021 22:04:33 - INFO - __main__ - Step 5863: {'lr': 0.0004991604092788465, 'samples': 1125696, 'steps': 5862, 'loss/train': 3.404467821121216}} +11/06/2021 22:04:36 - INFO - __main__ - Step 5868: {'lr': 0.0004991582351140747, 'samples': 1126656, 'steps': 5867, 'loss/train': 1.8088363409042358} +11/06/2021 22:04:38 - INFO - __main__ - Step 5872: {'lr': 0.0004991564937614526, 'samples': 1127424, 'steps': 5871, 'loss/train': 2.1050267219543457} +11/06/2021 22:04:38 - INFO - __main__ - Step 5872: {'lr': 0.0004991564937614526, 'samples': 1127424, 'steps': 5871, 'loss/train': 2.1050267219543457} +11/06/2021 22:04:41 - INFO - __main__ - Step 5879: {'lr': 0.0004991534420721278, 'samples': 1128768, 'steps': 5878, 'loss/train': 1.775754451751709}} +11/06/2021 22:04:43 - INFO - __main__ - Step 5884: {'lr': 0.0004991512589260939, 'samples': 1129728, 'steps': 5883, 'loss/train': 2.0570759773254395} +11/06/2021 22:04:46 - INFO - __main__ - Step 5889: {'lr': 0.0004991490729734672, 'samples': 1130688, 'steps': 5888, 'loss/train': 1.4462894201278687} +11/06/2021 22:04:46 - INFO - __main__ - Step 5889: {'lr': 0.0004991490729734672, 'samples': 1130688, 'steps': 5888, 'loss/train': 1.4462894201278687} +11/06/2021 22:04:48 - INFO - __main__ - Step 5895: {'lr': 0.0004991464461256472, 'samples': 1131840, 'steps': 5894, 'loss/train': 1.8709157705307007} +11/06/2021 22:04:51 - INFO - __main__ - Step 5900: {'lr': 0.0004991442539986029, 'samples': 1132800, 'steps': 5899, 'loss/train': 2.119931697845459}} +11/06/2021 22:04:53 - INFO - __main__ - Step 5905: {'lr': 0.0004991420590650448, 'samples': 1133760, 'steps': 5904, 'loss/train': 1.9303275346755981} +11/06/2021 22:04:53 - INFO - __main__ - Step 5905: {'lr': 0.0004991420590650448, 'samples': 1133760, 'steps': 5904, 'loss/train': 1.9303275346755981} +11/06/2021 22:04:57 - INFO - __main__ - Step 5912: {'lr': 0.0004991389814431672, 'samples': 1135104, 'steps': 5911, 'loss/train': 2.336418390274048}} +11/06/2021 22:04:58 - INFO - __main__ - Step 5916: {'lr': 0.0004991372203324098, 'samples': 1135872, 'steps': 5915, 'loss/train': 1.72451913356781}}} +11/06/2021 22:05:00 - INFO - __main__ - Step 5920: {'lr': 0.0004991354574255344, 'samples': 1136640, 'steps': 5919, 'loss/train': 1.7401177883148193} +11/06/2021 22:05:03 - INFO - __main__ - Step 5925: {'lr': 0.0004991332512661682, 'samples': 1137600, 'steps': 5924, 'loss/train': 1.9979768991470337} +11/06/2021 22:05:03 - INFO - __main__ - Step 5925: {'lr': 0.0004991332512661682, 'samples': 1137600, 'steps': 5924, 'loss/train': 1.9979768991470337} +11/06/2021 22:05:07 - INFO - __main__ - Step 5933: {'lr': 0.0004991297155739015, 'samples': 1139136, 'steps': 5932, 'loss/train': 2.3104774951934814} +11/06/2021 22:05:09 - INFO - __main__ - Step 5937: {'lr': 0.0004991279450336656, 'samples': 1139904, 'steps': 5936, 'loss/train': 2.049226999282837}} +11/06/2021 22:05:11 - INFO - __main__ - Step 5942: {'lr': 0.0004991257293326752, 'samples': 1140864, 'steps': 5941, 'loss/train': 1.340391993522644}} +11/06/2021 22:05:13 - INFO - __main__ - Step 5946: {'lr': 0.0004991239547513419, 'samples': 1141632, 'steps': 5945, 'loss/train': 1.9071139097213745} +11/06/2021 22:05:13 - INFO - __main__ - Step 5946: {'lr': 0.0004991239547513419, 'samples': 1141632, 'steps': 5945, 'loss/train': 1.9071139097213745} +11/06/2021 22:05:17 - INFO - __main__ - Step 5952: {'lr': 0.0004991212895118035, 'samples': 1142784, 'steps': 5951, 'loss/train': 2.292984962463379}} +11/06/2021 22:05:19 - INFO - __main__ - Step 5958: {'lr': 0.0004991186202312576, 'samples': 1143936, 'steps': 5957, 'loss/train': 2.46972393989563}}} +11/06/2021 22:05:22 - INFO - __main__ - Step 5962: {'lr': 0.000499116838465911, 'samples': 1144704, 'steps': 5961, 'loss/train': 2.2520675659179688}} +11/06/2021 22:05:23 - INFO - __main__ - Step 5966: {'lr': 0.0004991150549045931, 'samples': 1145472, 'steps': 5965, 'loss/train': 2.390394926071167}} +11/06/2021 22:05:25 - INFO - __main__ - Step 5970: {'lr': 0.0004991132695473167, 'samples': 1146240, 'steps': 5969, 'loss/train': 1.7997961044311523} +11/06/2021 22:05:27 - INFO - __main__ - Step 5975: {'lr': 0.0004991110353251744, 'samples': 1147200, 'steps': 5974, 'loss/train': 1.894894003868103}} +11/06/2021 22:05:30 - INFO - __main__ - Step 5979: {'lr': 0.0004991092459270388, 'samples': 1147968, 'steps': 5978, 'loss/train': 1.8954336643218994} +11/06/2021 22:05:32 - INFO - __main__ - Step 5983: {'lr': 0.0004991074547329867, 'samples': 1148736, 'steps': 5982, 'loss/train': 2.0363080501556396} +11/06/2021 22:05:33 - INFO - __main__ - Step 5987: {'lr': 0.0004991056617430308, 'samples': 1149504, 'steps': 5986, 'loss/train': 1.5863991975784302} +11/06/2021 22:05:35 - INFO - __main__ - Step 5991: {'lr': 0.0004991038669571844, 'samples': 1150272, 'steps': 5990, 'loss/train': 2.2613940238952637} +11/06/2021 22:05:38 - INFO - __main__ - Step 5996: {'lr': 0.0004991016209494249, 'samples': 1151232, 'steps': 5995, 'loss/train': 1.6935555934906006} +11/06/2021 22:05:40 - INFO - __main__ - Step 6000: {'lr': 0.0004990998221228718, 'samples': 1152000, 'steps': 5999, 'loss/train': 2.1965417861938477} +11/06/2021 22:05:40 - INFO - __main__ - Step 6000: {'lr': 0.0004990998221228718, 'samples': 1152000, 'steps': 5999, 'loss/train': 2.1965417861938477} +11/06/2021 22:05:43 - INFO - __main__ - Step 6007: {'lr': 0.000499096669855151, 'samples': 1153344, 'steps': 6006, 'loss/train': 1.9373234510421753}} +11/06/2021 22:05:45 - INFO - __main__ - Step 6011: {'lr': 0.0004990948660900455, 'samples': 1154112, 'steps': 6010, 'loss/train': 1.6468206644058228} +11/06/2021 22:05:47 - INFO - __main__ - Step 6015: {'lr': 0.0004990930605291272, 'samples': 1154880, 'steps': 6014, 'loss/train': 1.9965391159057617} +11/06/2021 22:05:47 - INFO - __main__ - Step 6015: {'lr': 0.0004990930605291272, 'samples': 1154880, 'steps': 6014, 'loss/train': 1.9965391159057617} +11/06/2021 22:05:51 - INFO - __main__ - Step 6023: {'lr': 0.0004990894440199042, 'samples': 1156416, 'steps': 6022, 'loss/train': 2.2078778743743896} +11/06/2021 22:05:53 - INFO - __main__ - Step 6027: {'lr': 0.0004990876330716256, 'samples': 1157184, 'steps': 6026, 'loss/train': 1.7819007635116577} +11/06/2021 22:05:55 - INFO - __main__ - Step 6032: {'lr': 0.0004990853668609902, 'samples': 1158144, 'steps': 6031, 'loss/train': 1.8239428997039795} +11/06/2021 22:05:57 - INFO - __main__ - Step 6036: {'lr': 0.0004990835518722683, 'samples': 1158912, 'steps': 6035, 'loss/train': 1.736742615699768}} +11/06/2021 22:05:59 - INFO - __main__ - Step 6040: {'lr': 0.0004990817350878152, 'samples': 1159680, 'steps': 6039, 'loss/train': 1.2319962978363037} +11/06/2021 22:06:01 - INFO - __main__ - Step 6044: {'lr': 0.0004990799165076438, 'samples': 1160448, 'steps': 6043, 'loss/train': 0.32099586725234985} +11/06/2021 22:06:03 - INFO - __main__ - Step 6048: {'lr': 0.0004990780961317674, 'samples': 1161216, 'steps': 6047, 'loss/train': 1.82656729221344}85} +11/06/2021 22:06:05 - INFO - __main__ - Step 6052: {'lr': 0.000499076273960199, 'samples': 1161984, 'steps': 6051, 'loss/train': 2.0586600303649902}5} +11/06/2021 22:06:07 - INFO - __main__ - Step 6057: {'lr': 0.0004990739937205668, 'samples': 1162944, 'steps': 6056, 'loss/train': 1.2735779285430908}} +11/06/2021 22:06:09 - INFO - __main__ - Step 6061: {'lr': 0.0004990721675087397, 'samples': 1163712, 'steps': 6060, 'loss/train': 2.1596553325653076}} +11/06/2021 22:06:11 - INFO - __main__ - Step 6065: {'lr': 0.0004990703395012634, 'samples': 1164480, 'steps': 6064, 'loss/train': 2.094088554382324}}} +11/06/2021 22:06:13 - INFO - __main__ - Step 6069: {'lr': 0.000499068509698151, 'samples': 1165248, 'steps': 6068, 'loss/train': 1.7530931234359741}}} +11/06/2021 22:06:15 - INFO - __main__ - Step 6073: {'lr': 0.0004990666780994156, 'samples': 1166016, 'steps': 6072, 'loss/train': 2.116274356842041}}} +11/06/2021 22:06:17 - INFO - __main__ - Step 6078: {'lr': 0.0004990643860759222, 'samples': 1166976, 'steps': 6077, 'loss/train': 1.642020583152771}}} +11/06/2021 22:06:17 - INFO - __main__ - Step 6078: {'lr': 0.0004990643860759222, 'samples': 1166976, 'steps': 6077, 'loss/train': 1.642020583152771}}} +11/06/2021 22:06:17 - INFO - __main__ - Step 6078: {'lr': 0.0004990643860759222, 'samples': 1166976, 'steps': 6077, 'loss/train': 1.642020583152771}}} +11/06/2021 22:06:23 - INFO - __main__ - Step 6090: {'lr': 0.0004990588737726809, 'samples': 1169280, 'steps': 6089, 'loss/train': 2.0593221187591553}} +11/06/2021 22:06:25 - INFO - __main__ - Step 6094: {'lr': 0.0004990570327471427, 'samples': 1170048, 'steps': 6093, 'loss/train': 1.9696969985961914}} +11/06/2021 22:06:27 - INFO - __main__ - Step 6099: {'lr': 0.0004990547289402433, 'samples': 1171008, 'steps': 6098, 'loss/train': 1.9792393445968628}} +11/06/2021 22:06:30 - INFO - __main__ - Step 6104: {'lr': 0.0004990524223278384, 'samples': 1171968, 'steps': 6103, 'loss/train': 1.6591429710388184}} +11/06/2021 22:06:32 - INFO - __main__ - Step 6108: {'lr': 0.0004990505750179682, 'samples': 1172736, 'steps': 6107, 'loss/train': 1.9363466501235962}} +11/06/2021 22:06:34 - INFO - __main__ - Step 6112: {'lr': 0.0004990487259126043, 'samples': 1173504, 'steps': 6111, 'loss/train': 1.6976191997528076}} +11/06/2021 22:06:34 - INFO - __main__ - Step 6112: {'lr': 0.0004990487259126043, 'samples': 1173504, 'steps': 6111, 'loss/train': 1.6976191997528076}} +11/06/2021 22:06:37 - INFO - __main__ - Step 6119: {'lr': 0.0004990454856578513, 'samples': 1174848, 'steps': 6118, 'loss/train': 1.8817105293273926}} +11/06/2021 22:06:40 - INFO - __main__ - Step 6124: {'lr': 0.0004990431678236849, 'samples': 1175808, 'steps': 6123, 'loss/train': 1.8044439554214478}} +11/06/2021 22:06:42 - INFO - __main__ - Step 6128: {'lr': 0.0004990413115364803, 'samples': 1176576, 'steps': 6127, 'loss/train': 1.5602920055389404}} +11/06/2021 22:06:44 - INFO - __main__ - Step 6132: {'lr': 0.000499039453453849, 'samples': 1177344, 'steps': 6131, 'loss/train': 1.8965604305267334}}} +11/06/2021 22:06:45 - INFO - __main__ - Step 6136: {'lr': 0.0004990375935758042, 'samples': 1178112, 'steps': 6135, 'loss/train': 1.5371315479278564}} +11/06/2021 22:06:47 - INFO - __main__ - Step 6140: {'lr': 0.0004990357319023597, 'samples': 1178880, 'steps': 6139, 'loss/train': 1.368839144706726}}} +11/06/2021 22:06:47 - INFO - __main__ - Step 6140: {'lr': 0.0004990357319023597, 'samples': 1178880, 'steps': 6139, 'loss/train': 1.368839144706726}}} +11/06/2021 22:06:52 - INFO - __main__ - Step 6148: {'lr': 0.0004990320031693242, 'samples': 1180416, 'steps': 6147, 'loss/train': 2.2118520736694336}} +11/06/2021 22:06:53 - INFO - __main__ - Step 6152: {'lr': 0.0004990301361097603, 'samples': 1181184, 'steps': 6151, 'loss/train': 1.1245484352111816}} +11/06/2021 22:06:55 - INFO - __main__ - Step 6156: {'lr': 0.0004990282672548503, 'samples': 1181952, 'steps': 6155, 'loss/train': 1.679478645324707}}} +11/06/2021 22:06:57 - INFO - __main__ - Step 6160: {'lr': 0.0004990263966046075, 'samples': 1182720, 'steps': 6159, 'loss/train': 1.8187702894210815}} +11/06/2021 22:07:00 - INFO - __main__ - Step 6166: {'lr': 0.000499023587263024, 'samples': 1183872, 'steps': 6165, 'loss/train': 1.6445512771606445}}} +11/06/2021 22:07:02 - INFO - __main__ - Step 6170: {'lr': 0.0004990217121245084, 'samples': 1184640, 'steps': 6169, 'loss/train': 1.9792548418045044}} +11/06/2021 22:07:02 - INFO - __main__ - Step 6170: {'lr': 0.0004990217121245084, 'samples': 1184640, 'steps': 6169, 'loss/train': 1.9792548418045044}} +11/06/2021 22:07:05 - INFO - __main__ - Step 6177: {'lr': 0.0004990184263122088, 'samples': 1185984, 'steps': 6176, 'loss/train': 1.861528754234314}}} +11/06/2021 22:07:08 - INFO - __main__ - Step 6182: {'lr': 0.0004990160759373033, 'samples': 1186944, 'steps': 6181, 'loss/train': 2.10902738571167}}}} +11/06/2021 22:07:10 - INFO - __main__ - Step 6187: {'lr': 0.0004990137227573278, 'samples': 1187904, 'steps': 6186, 'loss/train': 3.2400269508361816}} +11/06/2021 22:07:12 - INFO - __main__ - Step 6191: {'lr': 0.0004990118381937148, 'samples': 1188672, 'steps': 6190, 'loss/train': 1.4901134967803955}} +11/06/2021 22:07:12 - INFO - __main__ - Step 6191: {'lr': 0.0004990118381937148, 'samples': 1188672, 'steps': 6190, 'loss/train': 1.4901134967803955}} +11/06/2021 22:07:15 - INFO - __main__ - Step 6198: {'lr': 0.0004990085358876658, 'samples': 1190016, 'steps': 6197, 'loss/train': 1.6927975416183472}} +11/06/2021 22:07:17 - INFO - __main__ - Step 6202: {'lr': 0.0004990066463872462, 'samples': 1190784, 'steps': 6201, 'loss/train': 1.7335742712020874}} +11/06/2021 22:07:20 - INFO - __main__ - Step 6207: {'lr': 0.000499004281987256, 'samples': 1191744, 'steps': 6206, 'loss/train': 1.6635841131210327}}} +11/06/2021 22:07:20 - INFO - __main__ - Step 6207: {'lr': 0.000499004281987256, 'samples': 1191744, 'steps': 6206, 'loss/train': 1.6635841131210327}}} +11/06/2021 22:07:23 - INFO - __main__ - Step 6214: {'lr': 0.0004990009671149811, 'samples': 1193088, 'steps': 6213, 'loss/train': 1.9133497476577759}} +11/06/2021 22:07:26 - INFO - __main__ - Step 6218: {'lr': 0.0004989990704339361, 'samples': 1193856, 'steps': 6217, 'loss/train': 1.0167715549468994}} +11/06/2021 22:07:26 - INFO - __main__ - Step 6218: {'lr': 0.0004989990704339361, 'samples': 1193856, 'steps': 6217, 'loss/train': 1.0167715549468994}} +11/06/2021 22:07:30 - INFO - __main__ - Step 6226: {'lr': 0.0004989952716864931, 'samples': 1195392, 'steps': 6225, 'loss/train': 2.1702065467834473}} +11/06/2021 22:07:31 - INFO - __main__ - Step 6230: {'lr': 0.0004989933696201225, 'samples': 1196160, 'steps': 6229, 'loss/train': 1.936288595199585}}} +11/06/2021 22:07:34 - INFO - __main__ - Step 6234: {'lr': 0.0004989914657586707, 'samples': 1196928, 'steps': 6233, 'loss/train': 1.8493226766586304}} +11/06/2021 22:07:36 - INFO - __main__ - Step 6239: {'lr': 0.0004989890834075441, 'samples': 1197888, 'steps': 6238, 'loss/train': 1.5966987609863281}} +11/06/2021 22:07:38 - INFO - __main__ - Step 6243: {'lr': 0.0004989871755072101, 'samples': 1198656, 'steps': 6242, 'loss/train': 1.8593974113464355}} +11/06/2021 22:07:38 - INFO - __main__ - Step 6243: {'lr': 0.0004989871755072101, 'samples': 1198656, 'steps': 6242, 'loss/train': 1.8593974113464355}} +11/06/2021 22:07:41 - INFO - __main__ - Step 6250: {'lr': 0.0004989838323623272, 'samples': 1200000, 'steps': 6249, 'loss/train': 2.3803365230560303}} +11/06/2021 22:07:43 - INFO - __main__ - Step 6254: {'lr': 0.000498981919525676, 'samples': 1200768, 'steps': 6253, 'loss/train': 1.925179362297058}3}} +11/06/2021 22:07:46 - INFO - __main__ - Step 6259: {'lr': 0.0004989795259556469, 'samples': 1201728, 'steps': 6258, 'loss/train': 2.1959168910980225}} +11/06/2021 22:07:48 - INFO - __main__ - Step 6264: {'lr': 0.0004989771295809594, 'samples': 1202688, 'steps': 6263, 'loss/train': 1.5440324544906616}} +11/06/2021 22:07:50 - INFO - __main__ - Step 6268: {'lr': 0.0004989752104618736, 'samples': 1203456, 'steps': 6267, 'loss/train': 2.009376287460327}}} +11/06/2021 22:07:50 - INFO - __main__ - Step 6268: {'lr': 0.0004989752104618736, 'samples': 1203456, 'steps': 6267, 'loss/train': 2.009376287460327}}} +11/06/2021 22:07:53 - INFO - __main__ - Step 6275: {'lr': 0.0004989718476843828, 'samples': 1204800, 'steps': 6274, 'loss/train': 1.9315811395645142}} +11/06/2021 22:07:55 - INFO - __main__ - Step 6279: {'lr': 0.0004989699236292173, 'samples': 1205568, 'steps': 6278, 'loss/train': 1.9111852645874023}} +11/06/2021 22:07:58 - INFO - __main__ - Step 6284: {'lr': 0.0004989675160361669, 'samples': 1206528, 'steps': 6283, 'loss/train': 2.0830070972442627}} +11/06/2021 22:07:58 - INFO - __main__ - Step 6284: {'lr': 0.0004989675160361669, 'samples': 1206528, 'steps': 6283, 'loss/train': 2.0830070972442627}} +11/06/2021 22:08:02 - INFO - __main__ - Step 6292: {'lr': 0.0004989636580538896, 'samples': 1208064, 'steps': 6291, 'loss/train': 1.3750081062316895}} +11/06/2021 22:08:03 - INFO - __main__ - Step 6296: {'lr': 0.0004989617263704437, 'samples': 1208832, 'steps': 6295, 'loss/train': 1.7614363431930542}} +11/06/2021 22:08:06 - INFO - __main__ - Step 6300: {'lr': 0.0004989597928921447, 'samples': 1209600, 'steps': 6299, 'loss/train': 2.2829113006591797}} +11/06/2021 22:08:08 - INFO - __main__ - Step 6305: {'lr': 0.0004989573735202802, 'samples': 1210560, 'steps': 6304, 'loss/train': 1.910634994506836}}} +11/06/2021 22:08:10 - INFO - __main__ - Step 6309: {'lr': 0.000498955436003613, 'samples': 1211328, 'steps': 6308, 'loss/train': 1.7411454916000366}}} +11/06/2021 22:08:12 - INFO - __main__ - Step 6313: {'lr': 0.0004989534966921382, 'samples': 1212096, 'steps': 6312, 'loss/train': 1.8578460216522217}} +11/06/2021 22:08:14 - INFO - __main__ - Step 6317: {'lr': 0.0004989515555858697, 'samples': 1212864, 'steps': 6316, 'loss/train': 2.206059694290161}}} +11/06/2021 22:08:16 - INFO - __main__ - Step 6321: {'lr': 0.0004989496126848215, 'samples': 1213632, 'steps': 6320, 'loss/train': 1.8948540687561035}} +11/06/2021 22:08:18 - INFO - __main__ - Step 6326: {'lr': 0.0004989471815346237, 'samples': 1214592, 'steps': 6325, 'loss/train': 2.1662731170654297}} +11/06/2021 22:08:20 - INFO - __main__ - Step 6330: {'lr': 0.0004989452345953725, 'samples': 1215360, 'steps': 6329, 'loss/train': 1.8572430610656738}} +11/06/2021 22:08:20 - INFO - __main__ - Step 6330: {'lr': 0.0004989452345953725, 'samples': 1215360, 'steps': 6329, 'loss/train': 1.8572430610656738}} +11/06/2021 22:08:24 - INFO - __main__ - Step 6337: {'lr': 0.0004989418231331124, 'samples': 1216704, 'steps': 6336, 'loss/train': 2.056525230407715}}} +11/06/2021 22:08:26 - INFO - __main__ - Step 6342: {'lr': 0.0004989393830092705, 'samples': 1217664, 'steps': 6341, 'loss/train': 2.555983781814575}}} +11/06/2021 22:08:28 - INFO - __main__ - Step 6347: {'lr': 0.0004989369400812225, 'samples': 1218624, 'steps': 6346, 'loss/train': 1.2773443460464478}} +11/06/2021 22:08:31 - INFO - __main__ - Step 6351: {'lr': 0.0004989349837197742, 'samples': 1219392, 'steps': 6350, 'loss/train': 1.6861871480941772}} +11/06/2021 22:08:33 - INFO - __main__ - Step 6355: {'lr': 0.0004989330255636656, 'samples': 1220160, 'steps': 6354, 'loss/train': 1.5128992795944214}} +11/06/2021 22:08:34 - INFO - __main__ - Step 6359: {'lr': 0.000498931065612911, 'samples': 1220928, 'steps': 6358, 'loss/train': 1.3788177967071533}}} +11/06/2021 22:08:36 - INFO - __main__ - Step 6363: {'lr': 0.0004989291038675245, 'samples': 1221696, 'steps': 6362, 'loss/train': 2.109246015548706}}} +11/06/2021 22:08:39 - INFO - __main__ - Step 6368: {'lr': 0.0004989266491621117, 'samples': 1222656, 'steps': 6367, 'loss/train': 1.7916598320007324}} +11/06/2021 22:08:41 - INFO - __main__ - Step 6372: {'lr': 0.0004989246833788549, 'samples': 1223424, 'steps': 6371, 'loss/train': 1.6870710849761963}} +11/06/2021 22:08:41 - INFO - __main__ - Step 6372: {'lr': 0.0004989246833788549, 'samples': 1223424, 'steps': 6371, 'loss/train': 1.6870710849761963}} +11/06/2021 22:08:41 - INFO - __main__ - Step 6372: {'lr': 0.0004989246833788549, 'samples': 1223424, 'steps': 6371, 'loss/train': 1.6870710849761963}} +11/06/2021 22:08:46 - INFO - __main__ - Step 6381: {'lr': 0.0004989202538050939, 'samples': 1225152, 'steps': 6380, 'loss/train': 1.969157099723816}}} +11/06/2021 22:08:49 - INFO - __main__ - Step 6387: {'lr': 0.000498917295708727, 'samples': 1226304, 'steps': 6386, 'loss/train': 2.260986328125}816}}} +11/06/2021 22:08:51 - INFO - __main__ - Step 6391: {'lr': 0.0004989153214013135, 'samples': 1227072, 'steps': 6390, 'loss/train': 2.1878926753997803}} +11/06/2021 22:08:51 - INFO - __main__ - Step 6391: {'lr': 0.0004989153214013135, 'samples': 1227072, 'steps': 6390, 'loss/train': 2.1878926753997803}} +11/06/2021 22:08:54 - INFO - __main__ - Step 6398: {'lr': 0.0004989118620452884, 'samples': 1228416, 'steps': 6397, 'loss/train': 1.6816266775131226}} +11/06/2021 22:08:56 - INFO - __main__ - Step 6402: {'lr': 0.0004989098828029836, 'samples': 1229184, 'steps': 6401, 'loss/train': 2.1822431087493896}} +11/06/2021 22:08:59 - INFO - __main__ - Step 6407: {'lr': 0.0004989074062266177, 'samples': 1230144, 'steps': 6406, 'loss/train': 5.536162853240967}}} +11/06/2021 22:09:01 - INFO - __main__ - Step 6411: {'lr': 0.0004989054229467546, 'samples': 1230912, 'steps': 6410, 'loss/train': 1.9058226346969604}} +11/06/2021 22:09:03 - INFO - __main__ - Step 6415: {'lr': 0.0004989034378724443, 'samples': 1231680, 'steps': 6414, 'loss/train': 2.1043949127197266}} +11/06/2021 22:09:04 - INFO - __main__ - Step 6419: {'lr': 0.0004989014510037013, 'samples': 1232448, 'steps': 6418, 'loss/train': 1.0096818208694458}} +11/06/2021 22:09:06 - INFO - __main__ - Step 6423: {'lr': 0.00049889946234054, 'samples': 1233216, 'steps': 6422, 'loss/train': 1.466779351234436}58}} +11/06/2021 22:09:09 - INFO - __main__ - Step 6428: {'lr': 0.0004988969739882091, 'samples': 1234176, 'steps': 6427, 'loss/train': 1.8715691566467285}} +11/06/2021 22:09:09 - INFO - __main__ - Step 6428: {'lr': 0.0004988969739882091, 'samples': 1234176, 'steps': 6427, 'loss/train': 1.8715691566467285}} +11/06/2021 22:09:12 - INFO - __main__ - Step 6433: {'lr': 0.0004988944828321499, 'samples': 1235136, 'steps': 6432, 'loss/train': 1.8814183473587036}} +11/06/2021 22:09:12 - INFO - __main__ - Step 6433: {'lr': 0.0004988944828321499, 'samples': 1235136, 'steps': 6432, 'loss/train': 1.8814183473587036}} +11/06/2021 22:09:16 - INFO - __main__ - Step 6442: {'lr': 0.0004988899916859372, 'samples': 1236864, 'steps': 6441, 'loss/train': 2.750673294067383}}} +11/06/2021 22:09:18 - INFO - __main__ - Step 6446: {'lr': 0.0004988879927051484, 'samples': 1237632, 'steps': 6445, 'loss/train': 1.573569655418396}}} +11/06/2021 22:09:20 - INFO - __main__ - Step 6451: {'lr': 0.0004988854914558994, 'samples': 1238592, 'steps': 6450, 'loss/train': 1.7760518789291382}} +11/06/2021 22:09:20 - INFO - __main__ - Step 6451: {'lr': 0.0004988854914558994, 'samples': 1238592, 'steps': 6450, 'loss/train': 1.7760518789291382}} +11/06/2021 22:09:25 - INFO - __main__ - Step 6459: {'lr': 0.0004988814836256269, 'samples': 1240128, 'steps': 6458, 'loss/train': 1.4734045267105103}} +11/06/2021 22:09:26 - INFO - __main__ - Step 6463: {'lr': 0.0004988794770190717, 'samples': 1240896, 'steps': 6462, 'loss/train': 2.106597661972046}}} +11/06/2021 22:09:29 - INFO - __main__ - Step 6468: {'lr': 0.0004988769662377013, 'samples': 1241856, 'steps': 6467, 'loss/train': 2.2871172428131104}} +11/06/2021 22:09:31 - INFO - __main__ - Step 6472: {'lr': 0.0004988749555940814, 'samples': 1242624, 'steps': 6471, 'loss/train': 1.6348545551300049}} +11/06/2021 22:09:33 - INFO - __main__ - Step 6476: {'lr': 0.0004988729431562339, 'samples': 1243392, 'steps': 6475, 'loss/train': 2.184319496154785}}} +11/06/2021 22:09:35 - INFO - __main__ - Step 6480: {'lr': 0.0004988709289241736, 'samples': 1244160, 'steps': 6479, 'loss/train': 2.1878020763397217}} +11/06/2021 22:09:36 - INFO - __main__ - Step 6484: {'lr': 0.000498868912897915, 'samples': 1244928, 'steps': 6483, 'loss/train': 1.5354762077331543}}} +11/06/2021 22:09:39 - INFO - __main__ - Step 6489: {'lr': 0.0004988663903420222, 'samples': 1245888, 'steps': 6488, 'loss/train': 2.216024398803711}}} +11/06/2021 22:09:39 - INFO - __main__ - Step 6489: {'lr': 0.0004988663903420222, 'samples': 1245888, 'steps': 6488, 'loss/train': 2.216024398803711}}} +11/06/2021 22:09:43 - INFO - __main__ - Step 6497: {'lr': 0.0004988623484215673, 'samples': 1247424, 'steps': 6496, 'loss/train': 0.6462783217430115}} +11/06/2021 22:09:45 - INFO - __main__ - Step 6501: {'lr': 0.0004988603247701276, 'samples': 1248192, 'steps': 6500, 'loss/train': 1.803402066230774}}} +11/06/2021 22:09:46 - INFO - __main__ - Step 6505: {'lr': 0.0004988582993245661, 'samples': 1248960, 'steps': 6504, 'loss/train': 2.119647264480591}}} +11/06/2021 22:09:48 - INFO - __main__ - Step 6509: {'lr': 0.0004988562720848973, 'samples': 1249728, 'steps': 6508, 'loss/train': 2.310293674468994}}} +11/06/2021 22:09:51 - INFO - __main__ - Step 6514: {'lr': 0.0004988537355123699, 'samples': 1250688, 'steps': 6513, 'loss/train': 2.3833720684051514}} +11/06/2021 22:09:53 - INFO - __main__ - Step 6518: {'lr': 0.0004988517042360128, 'samples': 1251456, 'steps': 6517, 'loss/train': 1.9547860622406006}} +11/06/2021 22:09:55 - INFO - __main__ - Step 6522: {'lr': 0.0004988496711655961, 'samples': 1252224, 'steps': 6521, 'loss/train': 1.5848283767700195}} +11/06/2021 22:09:56 - INFO - __main__ - Step 6526: {'lr': 0.0004988476363011341, 'samples': 1252992, 'steps': 6525, 'loss/train': 2.017069101333618}}} +11/06/2021 22:09:58 - INFO - __main__ - Step 6530: {'lr': 0.0004988455996426418, 'samples': 1253760, 'steps': 6529, 'loss/train': 1.9897722005844116}} +11/06/2021 22:10:01 - INFO - __main__ - Step 6535: {'lr': 0.0004988430512966932, 'samples': 1254720, 'steps': 6534, 'loss/train': 2.3683085441589355}} +11/06/2021 22:10:03 - INFO - __main__ - Step 6539: {'lr': 0.000498841010601686, 'samples': 1255488, 'steps': 6538, 'loss/train': 2.037982225418091}5}} +11/06/2021 22:10:05 - INFO - __main__ - Step 6543: {'lr': 0.000498838968112696, 'samples': 1256256, 'steps': 6542, 'loss/train': 1.6090011596679688}}} +11/06/2021 22:10:07 - INFO - __main__ - Step 6547: {'lr': 0.000498836923829738, 'samples': 1257024, 'steps': 6546, 'loss/train': 1.8499354124069214}}} +11/06/2021 22:10:09 - INFO - __main__ - Step 6551: {'lr': 0.0004988348777528267, 'samples': 1257792, 'steps': 6550, 'loss/train': 2.171156883239746}}} +11/06/2021 22:10:11 - INFO - __main__ - Step 6556: {'lr': 0.0004988323176339633, 'samples': 1258752, 'steps': 6555, 'loss/train': 1.467564582824707}}} +11/06/2021 22:10:11 - INFO - __main__ - Step 6556: {'lr': 0.0004988323176339633, 'samples': 1258752, 'steps': 6555, 'loss/train': 1.467564582824707}}} +11/06/2021 22:10:15 - INFO - __main__ - Step 6564: {'lr': 0.0004988282156135539, 'samples': 1260288, 'steps': 6563, 'loss/train': 1.7303180694580078}} +11/06/2021 22:10:17 - INFO - __main__ - Step 6568: {'lr': 0.000498826161912506, 'samples': 1261056, 'steps': 6567, 'loss/train': 1.8563683032989502}}} +11/06/2021 22:10:18 - INFO - __main__ - Step 6572: {'lr': 0.0004988241064175826, 'samples': 1261824, 'steps': 6571, 'loss/train': 2.2202649116516113}} +11/06/2021 22:10:21 - INFO - __main__ - Step 6577: {'lr': 0.0004988215345263132, 'samples': 1262784, 'steps': 6576, 'loss/train': 1.774949550628662}}} +11/06/2021 22:10:21 - INFO - __main__ - Step 6577: {'lr': 0.0004988215345263132, 'samples': 1262784, 'steps': 6576, 'loss/train': 1.774949550628662}}} +11/06/2021 22:10:25 - INFO - __main__ - Step 6585: {'lr': 0.0004988174136703066, 'samples': 1264320, 'steps': 6584, 'loss/train': 1.922788381576538}}} +11/06/2021 22:10:27 - INFO - __main__ - Step 6589: {'lr': 0.0004988153505515771, 'samples': 1265088, 'steps': 6588, 'loss/train': 2.8506147861480713}} +11/06/2021 22:10:29 - INFO - __main__ - Step 6593: {'lr': 0.0004988132856390498, 'samples': 1265856, 'steps': 6592, 'loss/train': 1.3303931951522827}} +11/06/2021 22:10:31 - INFO - __main__ - Step 6597: {'lr': 0.0004988112189327397, 'samples': 1266624, 'steps': 6596, 'loss/train': 2.0449981689453125}} +11/06/2021 22:10:31 - INFO - __main__ - Step 6597: {'lr': 0.0004988112189327397, 'samples': 1266624, 'steps': 6596, 'loss/train': 2.0449981689453125}} +11/06/2021 22:10:35 - INFO - __main__ - Step 6606: {'lr': 0.0004988065622851006, 'samples': 1268352, 'steps': 6605, 'loss/train': 1.55886709690094}5}} +11/06/2021 22:10:37 - INFO - __main__ - Step 6610: {'lr': 0.0004988044897490993, 'samples': 1269120, 'steps': 6609, 'loss/train': 1.8489357233047485}} +11/06/2021 22:10:39 - INFO - __main__ - Step 6614: {'lr': 0.0004988024154193785, 'samples': 1269888, 'steps': 6613, 'loss/train': 2.244598627090454}}} +11/06/2021 22:10:41 - INFO - __main__ - Step 6618: {'lr': 0.0004988003392959533, 'samples': 1270656, 'steps': 6617, 'loss/train': 2.182772397994995}}} +11/06/2021 22:10:43 - INFO - __main__ - Step 6622: {'lr': 0.0004987982613788384, 'samples': 1271424, 'steps': 6621, 'loss/train': 1.808817744255066}}} +11/06/2021 22:10:45 - INFO - __main__ - Step 6626: {'lr': 0.0004987961816680492, 'samples': 1272192, 'steps': 6625, 'loss/train': 1.5684220790863037}} +11/06/2021 22:10:47 - INFO - __main__ - Step 6630: {'lr': 0.0004987941001636004, 'samples': 1272960, 'steps': 6629, 'loss/train': 2.308150291442871}}} +11/06/2021 22:10:48 - INFO - __main__ - Step 6634: {'lr': 0.0004987920168655071, 'samples': 1273728, 'steps': 6633, 'loss/train': 1.4046695232391357}} +11/06/2021 22:10:51 - INFO - __main__ - Step 6639: {'lr': 0.0004987894102206008, 'samples': 1274688, 'steps': 6638, 'loss/train': 1.5049811601638794}} +11/06/2021 22:10:53 - INFO - __main__ - Step 6644: {'lr': 0.0004987868007731778, 'samples': 1275648, 'steps': 6643, 'loss/train': 1.0979185104370117}} +11/06/2021 22:10:53 - INFO - __main__ - Step 6644: {'lr': 0.0004987868007731778, 'samples': 1275648, 'steps': 6643, 'loss/train': 1.0979185104370117}} +11/06/2021 22:10:53 - INFO - __main__ - Step 6644: {'lr': 0.0004987868007731778, 'samples': 1275648, 'steps': 6643, 'loss/train': 1.0979185104370117}} +11/06/2021 22:10:58 - INFO - __main__ - Step 6654: {'lr': 0.000498781573470899, 'samples': 1277568, 'steps': 6653, 'loss/train': 2.209815502166748}7}} +11/06/2021 22:11:01 - INFO - __main__ - Step 6659: {'lr': 0.0004987789556161022, 'samples': 1278528, 'steps': 6658, 'loss/train': 0.2782423198223114}} +11/06/2021 22:11:03 - INFO - __main__ - Step 6663: {'lr': 0.0004987768593145362, 'samples': 1279296, 'steps': 6662, 'loss/train': 1.7183184623718262}} +11/06/2021 22:11:05 - INFO - __main__ - Step 6667: {'lr': 0.0004987747612194499, 'samples': 1280064, 'steps': 6666, 'loss/train': 1.2572715282440186}} +11/06/2021 22:11:07 - INFO - __main__ - Step 6671: {'lr': 0.0004987726613308584, 'samples': 1280832, 'steps': 6670, 'loss/train': 1.7459203004837036}} +11/06/2021 22:11:08 - INFO - __main__ - Step 6675: {'lr': 0.0004987705596487771, 'samples': 1281600, 'steps': 6674, 'loss/train': 1.3550761938095093}} +11/06/2021 22:11:10 - INFO - __main__ - Step 6679: {'lr': 0.000498768456173221, 'samples': 1282368, 'steps': 6678, 'loss/train': 1.7885398864746094}}} +11/06/2021 22:11:13 - INFO - __main__ - Step 6685: {'lr': 0.0004987652975971546, 'samples': 1283520, 'steps': 6684, 'loss/train': 2.027494192123413}}} +11/06/2021 22:11:15 - INFO - __main__ - Step 6689: {'lr': 0.0004987631896379779, 'samples': 1284288, 'steps': 6688, 'loss/train': 1.4638168811798096}} +11/06/2021 22:11:15 - INFO - __main__ - Step 6689: {'lr': 0.0004987631896379779, 'samples': 1284288, 'steps': 6688, 'loss/train': 1.4638168811798096}} +11/06/2021 22:11:19 - INFO - __main__ - Step 6696: {'lr': 0.0004987594963940066, 'samples': 1285632, 'steps': 6695, 'loss/train': 1.7367832660675049}} +11/06/2021 22:11:21 - INFO - __main__ - Step 6700: {'lr': 0.0004987573835029569, 'samples': 1286400, 'steps': 6699, 'loss/train': 2.1391384601593018}} +11/06/2021 22:11:23 - INFO - __main__ - Step 6705: {'lr': 0.0004987547398672061, 'samples': 1287360, 'steps': 6704, 'loss/train': 1.8196769952774048}} +11/06/2021 22:11:25 - INFO - __main__ - Step 6710: {'lr': 0.000498752093429329, 'samples': 1288320, 'steps': 6709, 'loss/train': 1.8113231658935547}}} +11/06/2021 22:11:27 - INFO - __main__ - Step 6714: {'lr': 0.0004987499742615167, 'samples': 1289088, 'steps': 6713, 'loss/train': 1.8710038661956787}} +11/06/2021 22:11:27 - INFO - __main__ - Step 6714: {'lr': 0.0004987499742615167, 'samples': 1289088, 'steps': 6713, 'loss/train': 1.8710038661956787}} +11/06/2021 22:11:31 - INFO - __main__ - Step 6721: {'lr': 0.0004987462614026624, 'samples': 1290432, 'steps': 6720, 'loss/train': 1.4481638669967651}} +11/06/2021 22:11:33 - INFO - __main__ - Step 6725: {'lr': 0.0004987441373032393, 'samples': 1291200, 'steps': 6724, 'loss/train': 1.264276385307312}}} +11/06/2021 22:11:35 - INFO - __main__ - Step 6730: {'lr': 0.000498741479657156, 'samples': 1292160, 'steps': 6729, 'loss/train': 2.122650146484375}}}} +11/06/2021 22:11:38 - INFO - __main__ - Step 6735: {'lr': 0.0004987388192090959, 'samples': 1293120, 'steps': 6734, 'loss/train': 1.5254181623458862}} +11/06/2021 22:11:38 - INFO - __main__ - Step 6735: {'lr': 0.0004987388192090959, 'samples': 1293120, 'steps': 6734, 'loss/train': 1.5254181623458862}} +11/06/2021 22:11:41 - INFO - __main__ - Step 6742: {'lr': 0.0004987350898745477, 'samples': 1294464, 'steps': 6741, 'loss/train': 1.4959521293640137}} +11/06/2021 22:11:43 - INFO - __main__ - Step 6747: {'lr': 0.0004987324227018657, 'samples': 1295424, 'steps': 6746, 'loss/train': 2.1900782585144043}} +11/06/2021 22:11:45 - INFO - __main__ - Step 6751: {'lr': 0.0004987302869463686, 'samples': 1296192, 'steps': 6750, 'loss/train': 1.5255533456802368}} +11/06/2021 22:11:48 - INFO - __main__ - Step 6756: {'lr': 0.0004987276147303337, 'samples': 1297152, 'steps': 6755, 'loss/train': 1.5767613649368286}} +11/06/2021 22:11:48 - INFO - __main__ - Step 6756: {'lr': 0.0004987276147303337, 'samples': 1297152, 'steps': 6755, 'loss/train': 1.5767613649368286}} +11/06/2021 22:11:51 - INFO - __main__ - Step 6763: {'lr': 0.0004987238689208327, 'samples': 1298496, 'steps': 6762, 'loss/train': 1.8828072547912598}} +11/06/2021 22:11:53 - INFO - __main__ - Step 6767: {'lr': 0.0004987217259926904, 'samples': 1299264, 'steps': 6766, 'loss/train': 0.23178565502166748} +11/06/2021 22:11:56 - INFO - __main__ - Step 6772: {'lr': 0.0004987190448109354, 'samples': 1300224, 'steps': 6771, 'loss/train': 2.2244198322296143}} +11/06/2021 22:11:56 - INFO - __main__ - Step 6772: {'lr': 0.0004987190448109354, 'samples': 1300224, 'steps': 6771, 'loss/train': 2.2244198322296143}} +11/06/2021 22:11:59 - INFO - __main__ - Step 6779: {'lr': 0.0004987152864495887, 'samples': 1301568, 'steps': 6778, 'loss/train': 2.1859946250915527}} +11/06/2021 22:12:01 - INFO - __main__ - Step 6784: {'lr': 0.0004987125985437468, 'samples': 1302528, 'steps': 6783, 'loss/train': 2.15081524848938}7}} +11/06/2021 22:12:03 - INFO - __main__ - Step 6788: {'lr': 0.0004987104462018828, 'samples': 1303296, 'steps': 6787, 'loss/train': 1.6238676309585571}} +11/06/2021 22:12:06 - INFO - __main__ - Step 6793: {'lr': 0.0004987077532530899, 'samples': 1304256, 'steps': 6792, 'loss/train': 1.743523120880127}}} +11/06/2021 22:12:08 - INFO - __main__ - Step 6797: {'lr': 0.0004987055968769045, 'samples': 1305024, 'steps': 6796, 'loss/train': 1.779247522354126}}} +11/06/2021 22:12:08 - INFO - __main__ - Step 6797: {'lr': 0.0004987055968769045, 'samples': 1305024, 'steps': 6796, 'loss/train': 1.779247522354126}}} +11/06/2021 22:12:11 - INFO - __main__ - Step 6804: {'lr': 0.0004987018189041675, 'samples': 1306368, 'steps': 6803, 'loss/train': 1.7351499795913696}} +11/06/2021 22:12:13 - INFO - __main__ - Step 6808: {'lr': 0.0004986996575972517, 'samples': 1307136, 'steps': 6807, 'loss/train': 0.7521131038665771}} +11/06/2021 22:12:13 - INFO - __main__ - Step 6808: {'lr': 0.0004986996575972517, 'samples': 1307136, 'steps': 6807, 'loss/train': 0.7521131038665771}} +11/06/2021 22:12:13 - INFO - __main__ - Step 6808: {'lr': 0.0004986996575972517, 'samples': 1307136, 'steps': 6807, 'loss/train': 0.7521131038665771}} +11/06/2021 22:12:19 - INFO - __main__ - Step 6820: {'lr': 0.0004986931629187848, 'samples': 1309440, 'steps': 6819, 'loss/train': 2.2714736461639404}} +11/06/2021 22:12:21 - INFO - __main__ - Step 6824: {'lr': 0.0004986909944401082, 'samples': 1310208, 'steps': 6823, 'loss/train': 1.4807871580123901}} +11/06/2021 22:12:24 - INFO - __main__ - Step 6829: {'lr': 0.0004986882813204967, 'samples': 1311168, 'steps': 6828, 'loss/train': 2.6850411891937256}} +11/06/2021 22:12:24 - INFO - __main__ - Step 6829: {'lr': 0.0004986882813204967, 'samples': 1311168, 'steps': 6828, 'loss/train': 2.6850411891937256}} +11/06/2021 22:12:24 - INFO - __main__ - Step 6829: {'lr': 0.0004986882813204967, 'samples': 1311168, 'steps': 6828, 'loss/train': 2.6850411891937256}} +11/06/2021 22:12:29 - INFO - __main__ - Step 6839: {'lr': 0.0004986828466771718, 'samples': 1313088, 'steps': 6838, 'loss/train': 2.1545591354370117}} +11/06/2021 22:12:32 - INFO - __main__ - Step 6845: {'lr': 0.0004986795805126339, 'samples': 1314240, 'steps': 6844, 'loss/train': 1.878450632095337}}} +11/06/2021 22:12:34 - INFO - __main__ - Step 6849: {'lr': 0.0004986774008285816, 'samples': 1315008, 'steps': 6848, 'loss/train': 1.9744795560836792}} +11/06/2021 22:12:34 - INFO - __main__ - Step 6849: {'lr': 0.0004986774008285816, 'samples': 1315008, 'steps': 6848, 'loss/train': 1.9744795560836792}} +11/06/2021 22:12:37 - INFO - __main__ - Step 6856: {'lr': 0.000498673582067567, 'samples': 1316352, 'steps': 6855, 'loss/train': 1.685018539428711}2}} +11/06/2021 22:12:40 - INFO - __main__ - Step 6861: {'lr': 0.0004986708510196688, 'samples': 1317312, 'steps': 6860, 'loss/train': 1.852432131767273}}} +11/06/2021 22:12:42 - INFO - __main__ - Step 6866: {'lr': 0.0004986681171705893, 'samples': 1318272, 'steps': 6865, 'loss/train': 1.9213021993637085}} +11/06/2021 22:12:44 - INFO - __main__ - Step 6870: {'lr': 0.000498665928074496, 'samples': 1319040, 'steps': 6869, 'loss/train': 1.9043452739715576}}} +11/06/2021 22:12:44 - INFO - __main__ - Step 6870: {'lr': 0.000498665928074496, 'samples': 1319040, 'steps': 6869, 'loss/train': 1.9043452739715576}}} +11/06/2021 22:12:47 - INFO - __main__ - Step 6876: {'lr': 0.0004986626410690099, 'samples': 1320192, 'steps': 6875, 'loss/train': 1.3328086137771606}} +11/06/2021 22:12:49 - INFO - __main__ - Step 6881: {'lr': 0.0004986598988165718, 'samples': 1321152, 'steps': 6880, 'loss/train': 2.5729262828826904}} +11/06/2021 22:12:49 - INFO - __main__ - Step 6881: {'lr': 0.0004986598988165718, 'samples': 1321152, 'steps': 6880, 'loss/train': 2.5729262828826904}} +11/06/2021 22:12:53 - INFO - __main__ - Step 6889: {'lr': 0.0004986555053864833, 'samples': 1322688, 'steps': 6888, 'loss/train': 1.7372727394104004}} +11/06/2021 22:12:56 - INFO - __main__ - Step 6893: {'lr': 0.000498653305982463, 'samples': 1323456, 'steps': 6892, 'loss/train': 1.350880742073059}4}} +11/06/2021 22:12:57 - INFO - __main__ - Step 6897: {'lr': 0.0004986511047858134, 'samples': 1324224, 'steps': 6896, 'loss/train': 2.2133257389068604}} +11/06/2021 22:12:59 - INFO - __main__ - Step 6902: {'lr': 0.0004986483507691403, 'samples': 1325184, 'steps': 6901, 'loss/train': 1.9309344291687012}} +11/06/2021 22:13:02 - INFO - __main__ - Step 6907: {'lr': 0.0004986455939515395, 'samples': 1326144, 'steps': 6906, 'loss/train': 1.7874330282211304}} +11/06/2021 22:13:02 - INFO - __main__ - Step 6907: {'lr': 0.0004986455939515395, 'samples': 1326144, 'steps': 6906, 'loss/train': 1.7874330282211304}} +11/06/2021 22:13:05 - INFO - __main__ - Step 6914: {'lr': 0.0004986417297013987, 'samples': 1327488, 'steps': 6913, 'loss/train': 1.6202863454818726}} +11/06/2021 22:13:07 - INFO - __main__ - Step 6918: {'lr': 0.0004986395190937048, 'samples': 1328256, 'steps': 6917, 'loss/train': 1.7865066528320312}} +11/06/2021 22:13:09 - INFO - __main__ - Step 6922: {'lr': 0.000498637306693481, 'samples': 1329024, 'steps': 6921, 'loss/train': 1.9036977291107178}}} +11/06/2021 22:13:11 - INFO - __main__ - Step 6927: {'lr': 0.00049863453867248, 'samples': 1329984, 'steps': 6926, 'loss/train': 1.5846327543258667}}}} +11/06/2021 22:13:14 - INFO - __main__ - Step 6932: {'lr': 0.0004986317678507069, 'samples': 1330944, 'steps': 6931, 'loss/train': 1.773486852645874}}} +11/06/2021 22:13:14 - INFO - __main__ - Step 6932: {'lr': 0.0004986317678507069, 'samples': 1330944, 'steps': 6931, 'loss/train': 1.773486852645874}}} +11/06/2021 22:13:18 - INFO - __main__ - Step 6939: {'lr': 0.0004986278839949866, 'samples': 1332288, 'steps': 6938, 'loss/train': 2.0607035160064697}} +11/06/2021 22:13:19 - INFO - __main__ - Step 6943: {'lr': 0.0004986256621842417, 'samples': 1333056, 'steps': 6942, 'loss/train': 1.3075493574142456}} +11/06/2021 22:13:21 - INFO - __main__ - Step 6947: {'lr': 0.0004986234385810668, 'samples': 1333824, 'steps': 6946, 'loss/train': 1.9208937883377075}} +11/06/2021 22:13:24 - INFO - __main__ - Step 6952: {'lr': 0.0004986206565565173, 'samples': 1334784, 'steps': 6951, 'loss/train': 1.6181141138076782}} +11/06/2021 22:13:26 - INFO - __main__ - Step 6956: {'lr': 0.000498618428920433, 'samples': 1335552, 'steps': 6955, 'loss/train': 1.4519563913345337}}} +11/06/2021 22:13:28 - INFO - __main__ - Step 6960: {'lr': 0.0004986161994919706, 'samples': 1336320, 'steps': 6959, 'loss/train': 1.547726035118103}}} +11/06/2021 22:13:29 - INFO - __main__ - Step 6964: {'lr': 0.0004986139682711463, 'samples': 1337088, 'steps': 6963, 'loss/train': 2.060143232345581}}} +11/06/2021 22:13:32 - INFO - __main__ - Step 6968: {'lr': 0.000498611735257976, 'samples': 1337856, 'steps': 6967, 'loss/train': 1.8004080057144165}}} +11/06/2021 22:13:34 - INFO - __main__ - Step 6972: {'lr': 0.000498609500452476, 'samples': 1338624, 'steps': 6971, 'loss/train': 1.8543205261230469}}} +11/06/2021 22:13:36 - INFO - __main__ - Step 6976: {'lr': 0.0004986072638546623, 'samples': 1339392, 'steps': 6975, 'loss/train': 1.7745708227157593}} +11/06/2021 22:13:36 - INFO - __main__ - Step 6976: {'lr': 0.0004986072638546623, 'samples': 1339392, 'steps': 6975, 'loss/train': 1.7745708227157593}} +11/06/2021 22:13:36 - INFO - __main__ - Step 6976: {'lr': 0.0004986072638546623, 'samples': 1339392, 'steps': 6975, 'loss/train': 1.7745708227157593}} +11/06/2021 22:13:41 - INFO - __main__ - Step 6986: {'lr': 0.0004986016645188615, 'samples': 1341312, 'steps': 6985, 'loss/train': 1.4657028913497925}} +11/06/2021 22:13:44 - INFO - __main__ - Step 6991: {'lr': 0.0004985988606503426, 'samples': 1342272, 'steps': 6990, 'loss/train': 1.556723713874817}}} +11/06/2021 22:13:46 - INFO - __main__ - Step 6996: {'lr': 0.0004985960539814534, 'samples': 1343232, 'steps': 6995, 'loss/train': 1.901774287223816}}} +11/06/2021 22:13:46 - INFO - __main__ - Step 6996: {'lr': 0.0004985960539814534, 'samples': 1343232, 'steps': 6995, 'loss/train': 1.901774287223816}}} +11/06/2021 22:13:49 - INFO - __main__ - Step 7003: {'lr': 0.0004985921199404467, 'samples': 1344576, 'steps': 7002, 'loss/train': 1.5738434791564941}} +11/06/2021 22:13:51 - INFO - __main__ - Step 7007: {'lr': 0.0004985898694527498, 'samples': 1345344, 'steps': 7006, 'loss/train': 1.9892717599868774}} +11/06/2021 22:13:54 - INFO - __main__ - Step 7012: {'lr': 0.0004985870538228884, 'samples': 1346304, 'steps': 7011, 'loss/train': 1.831001877784729}}} +11/06/2021 22:13:54 - INFO - __main__ - Step 7012: {'lr': 0.0004985870538228884, 'samples': 1346304, 'steps': 7011, 'loss/train': 1.831001877784729}}} +11/06/2021 22:13:58 - INFO - __main__ - Step 7020: {'lr': 0.0004985825429906299, 'samples': 1347840, 'steps': 7019, 'loss/train': 1.8477237224578857}} +11/06/2021 22:13:59 - INFO - __main__ - Step 7024: {'lr': 0.0004985802848863135, 'samples': 1348608, 'steps': 7023, 'loss/train': 2.0270166397094727}} +11/06/2021 22:14:02 - INFO - __main__ - Step 7028: {'lr': 0.0004985780249898941, 'samples': 1349376, 'steps': 7027, 'loss/train': 1.8955899477005005}} +11/06/2021 22:14:04 - INFO - __main__ - Step 7033: {'lr': 0.0004985751975992497, 'samples': 1350336, 'steps': 7032, 'loss/train': 2.039046287536621}}} +11/06/2021 22:14:06 - INFO - __main__ - Step 7037: {'lr': 0.000498572933670658, 'samples': 1351104, 'steps': 7036, 'loss/train': 1.8642250299453735}}} +11/06/2021 22:14:08 - INFO - __main__ - Step 7041: {'lr': 0.0004985706679500163, 'samples': 1351872, 'steps': 7040, 'loss/train': 2.2261483669281006}} +11/06/2021 22:14:08 - INFO - __main__ - Step 7041: {'lr': 0.0004985706679500163, 'samples': 1351872, 'steps': 7040, 'loss/train': 2.2261483669281006}} +11/06/2021 22:14:11 - INFO - __main__ - Step 7048: {'lr': 0.000498566698626822, 'samples': 1353216, 'steps': 7047, 'loss/train': 2.0857248306274414}}} +11/06/2021 22:14:14 - INFO - __main__ - Step 7053: {'lr': 0.0004985638600359542, 'samples': 1354176, 'steps': 7052, 'loss/train': 2.2024543285369873}} +11/06/2021 22:14:16 - INFO - __main__ - Step 7058: {'lr': 0.0004985610186451104, 'samples': 1355136, 'steps': 7057, 'loss/train': 2.400442123413086}}} +11/06/2021 22:14:18 - INFO - __main__ - Step 7062: {'lr': 0.0004985587435164742, 'samples': 1355904, 'steps': 7061, 'loss/train': 2.2818222045898438}} +11/06/2021 22:14:18 - INFO - __main__ - Step 7062: {'lr': 0.0004985587435164742, 'samples': 1355904, 'steps': 7061, 'loss/train': 2.2818222045898438}} +11/06/2021 22:14:21 - INFO - __main__ - Step 7069: {'lr': 0.0004985547577294963, 'samples': 1357248, 'steps': 7068, 'loss/train': 1.4728955030441284}} +11/06/2021 22:14:24 - INFO - __main__ - Step 7074: {'lr': 0.0004985519073789447, 'samples': 1358208, 'steps': 7073, 'loss/train': 2.0647716522216797}} +11/06/2021 22:14:24 - INFO - __main__ - Step 7074: {'lr': 0.0004985519073789447, 'samples': 1358208, 'steps': 7073, 'loss/train': 2.0647716522216797}} +11/06/2021 22:14:27 - INFO - __main__ - Step 7081: {'lr': 0.000498547912184446, 'samples': 1359552, 'steps': 7080, 'loss/train': 2.0644752979278564}}} +11/06/2021 22:14:30 - INFO - __main__ - Step 7085: {'lr': 0.0004985456267523346, 'samples': 1360320, 'steps': 7084, 'loss/train': 1.65984308719635}}}} +11/06/2021 22:14:32 - INFO - __main__ - Step 7090: {'lr': 0.0004985427674424038, 'samples': 1361280, 'steps': 7089, 'loss/train': 1.8997712135314941}} +11/06/2021 22:14:32 - INFO - __main__ - Step 7090: {'lr': 0.0004985427674424038, 'samples': 1361280, 'steps': 7089, 'loss/train': 1.8997712135314941}} +11/06/2021 22:14:32 - INFO - __main__ - Step 7090: {'lr': 0.0004985427674424038, 'samples': 1361280, 'steps': 7089, 'loss/train': 1.8997712135314941}} +11/06/2021 22:14:38 - INFO - __main__ - Step 7101: {'lr': 0.0004985364671055223, 'samples': 1363392, 'steps': 7100, 'loss/train': 2.0017964839935303}} +11/06/2021 22:14:40 - INFO - __main__ - Step 7106: {'lr': 0.000498533598836542, 'samples': 1364352, 'steps': 7105, 'loss/train': 1.2057009935379028}}} +11/06/2021 22:14:42 - INFO - __main__ - Step 7110: {'lr': 0.0004985313022056191, 'samples': 1365120, 'steps': 7109, 'loss/train': 1.8806291818618774}} +11/06/2021 22:14:44 - INFO - __main__ - Step 7114: {'lr': 0.0004985290037829462, 'samples': 1365888, 'steps': 7113, 'loss/train': 3.7923812866210938}} +11/06/2021 22:14:46 - INFO - __main__ - Step 7118: {'lr': 0.00049852670356854, 'samples': 1366656, 'steps': 7117, 'loss/train': 1.7581599950790405}8}} +11/06/2021 22:14:48 - INFO - __main__ - Step 7122: {'lr': 0.000498524401562417, 'samples': 1367424, 'steps': 7121, 'loss/train': 1.7350369691848755}}} +11/06/2021 22:14:50 - INFO - __main__ - Step 7127: {'lr': 0.0004985215215351869, 'samples': 1368384, 'steps': 7126, 'loss/train': 1.9587048292160034}} +11/06/2021 22:14:50 - INFO - __main__ - Step 7127: {'lr': 0.0004985215215351869, 'samples': 1368384, 'steps': 7126, 'loss/train': 1.9587048292160034}} +11/06/2021 22:14:53 - INFO - __main__ - Step 7134: {'lr': 0.0004985174847939135, 'samples': 1369728, 'steps': 7133, 'loss/train': 2.039775848388672}}} +11/06/2021 22:14:56 - INFO - __main__ - Step 7138: {'lr': 0.0004985151756210897, 'samples': 1370496, 'steps': 7137, 'loss/train': 1.8486833572387695}} +11/06/2021 22:14:58 - INFO - __main__ - Step 7143: {'lr': 0.0004985122866355768, 'samples': 1371456, 'steps': 7142, 'loss/train': 2.1116602420806885}} +11/06/2021 22:15:00 - INFO - __main__ - Step 7148: {'lr': 0.0004985093948506689, 'samples': 1372416, 'steps': 7147, 'loss/train': 1.5859280824661255}} +11/06/2021 22:15:03 - INFO - __main__ - Step 7152: {'lr': 0.0004985070794072002, 'samples': 1373184, 'steps': 7151, 'loss/train': 2.0557656288146973}} +11/06/2021 22:15:05 - INFO - __main__ - Step 7156: {'lr': 0.0004985047621721561, 'samples': 1373952, 'steps': 7155, 'loss/train': 0.8238686323165894}} +11/06/2021 22:15:06 - INFO - __main__ - Step 7160: {'lr': 0.0004985024431455534, 'samples': 1374720, 'steps': 7159, 'loss/train': 1.8155590295791626}} +11/06/2021 22:15:08 - INFO - __main__ - Step 7164: {'lr': 0.0004985001223274089, 'samples': 1375488, 'steps': 7163, 'loss/train': 2.357848644256592}}} +11/06/2021 22:15:10 - INFO - __main__ - Step 7169: {'lr': 0.000498497218785398, 'samples': 1376448, 'steps': 7168, 'loss/train': 1.955859899520874}}}} +11/06/2021 22:15:10 - INFO - __main__ - Step 7169: {'lr': 0.000498497218785398, 'samples': 1376448, 'steps': 7168, 'loss/train': 1.955859899520874}}}} +11/06/2021 22:15:10 - INFO - __main__ - Step 7169: {'lr': 0.000498497218785398, 'samples': 1376448, 'steps': 7168, 'loss/train': 1.955859899520874}}}} +11/06/2021 22:15:16 - INFO - __main__ - Step 7179: {'lr': 0.000498491403303733, 'samples': 1378368, 'steps': 7178, 'loss/train': 2.4547572135925293}}} +11/06/2021 22:15:18 - INFO - __main__ - Step 7185: {'lr': 0.0004984879086403304, 'samples': 1379520, 'steps': 7184, 'loss/train': 2.017399311065674}}} +11/06/2021 22:15:21 - INFO - __main__ - Step 7189: {'lr': 0.000498485576625429, 'samples': 1380288, 'steps': 7188, 'loss/train': 1.9039487838745117}}} +11/06/2021 22:15:21 - INFO - __main__ - Step 7189: {'lr': 0.000498485576625429, 'samples': 1380288, 'steps': 7188, 'loss/train': 1.9039487838745117}}} +11/06/2021 22:15:24 - INFO - __main__ - Step 7196: {'lr': 0.0004984814912887563, 'samples': 1381632, 'steps': 7195, 'loss/train': 2.1821253299713135}} +11/06/2021 22:15:26 - INFO - __main__ - Step 7201: {'lr': 0.0004984785698322699, 'samples': 1382592, 'steps': 7200, 'loss/train': 1.3614236116409302}} +11/06/2021 22:15:29 - INFO - __main__ - Step 7206: {'lr': 0.0004984756455767684, 'samples': 1383552, 'steps': 7205, 'loss/train': 1.8581416606903076}} +11/06/2021 22:15:31 - INFO - __main__ - Step 7210: {'lr': 0.0004984733041570983, 'samples': 1384320, 'steps': 7209, 'loss/train': 1.8552770614624023}} +11/06/2021 22:15:31 - INFO - __main__ - Step 7210: {'lr': 0.0004984733041570983, 'samples': 1384320, 'steps': 7209, 'loss/train': 1.8552770614624023}} +11/06/2021 22:15:34 - INFO - __main__ - Step 7217: {'lr': 0.0004984692023622938, 'samples': 1385664, 'steps': 7216, 'loss/train': 2.0930893421173096}} +11/06/2021 22:15:36 - INFO - __main__ - Step 7222: {'lr': 0.000498466269150165, 'samples': 1386624, 'steps': 7221, 'loss/train': 1.4030883312225342}}} +11/06/2021 22:15:39 - INFO - __main__ - Step 7227: {'lr': 0.0004984633331391596, 'samples': 1387584, 'steps': 7226, 'loss/train': 1.6768375635147095}} +11/06/2021 22:15:39 - INFO - __main__ - Step 7227: {'lr': 0.0004984633331391596, 'samples': 1387584, 'steps': 7226, 'loss/train': 1.6768375635147095}} +11/06/2021 22:15:42 - INFO - __main__ - Step 7234: {'lr': 0.0004984592180217022, 'samples': 1388928, 'steps': 7233, 'loss/train': 1.602423906326294}}} +11/06/2021 22:15:44 - INFO - __main__ - Step 7238: {'lr': 0.0004984568640630648, 'samples': 1389696, 'steps': 7237, 'loss/train': 1.3969769477844238}} +11/06/2021 22:15:46 - INFO - __main__ - Step 7243: {'lr': 0.0004984539190958765, 'samples': 1390656, 'steps': 7242, 'loss/train': 2.117086887359619}}} +11/06/2021 22:15:46 - INFO - __main__ - Step 7243: {'lr': 0.0004984539190958765, 'samples': 1390656, 'steps': 7242, 'loss/train': 2.117086887359619}}} +11/06/2021 22:15:50 - INFO - __main__ - Step 7251: {'lr': 0.0004984492013270147, 'samples': 1392192, 'steps': 7250, 'loss/train': 1.9997104406356812}} +11/06/2021 22:15:52 - INFO - __main__ - Step 7255: {'lr': 0.0004984468397558384, 'samples': 1392960, 'steps': 7254, 'loss/train': 1.3238756656646729}} +11/06/2021 22:15:54 - INFO - __main__ - Step 7259: {'lr': 0.000498444476393521, 'samples': 1393728, 'steps': 7258, 'loss/train': 2.349273920059204}9}} +11/06/2021 22:15:56 - INFO - __main__ - Step 7264: {'lr': 0.0004984415196718582, 'samples': 1394688, 'steps': 7263, 'loss/train': 1.5477303266525269}} +11/06/2021 22:15:59 - INFO - __main__ - Step 7268: {'lr': 0.0004984391522795359, 'samples': 1395456, 'steps': 7267, 'loss/train': 1.868264079093933}}} +11/06/2021 22:16:01 - INFO - __main__ - Step 7272: {'lr': 0.0004984367830961281, 'samples': 1396224, 'steps': 7271, 'loss/train': 2.167809247970581}}} +11/06/2021 22:16:01 - INFO - __main__ - Step 7272: {'lr': 0.0004984367830961281, 'samples': 1396224, 'steps': 7271, 'loss/train': 2.167809247970581}}} +11/06/2021 22:16:04 - INFO - __main__ - Step 7279: {'lr': 0.000498432632715416, 'samples': 1397568, 'steps': 7278, 'loss/train': 0.6851865649223328}}} +11/06/2021 22:16:07 - INFO - __main__ - Step 7285: {'lr': 0.0004984290708805743, 'samples': 1398720, 'steps': 7284, 'loss/train': 1.7015665769577026}} +11/06/2021 22:16:09 - INFO - __main__ - Step 7289: {'lr': 0.0004984266940852434, 'samples': 1399488, 'steps': 7288, 'loss/train': 2.0083210468292236}} +11/06/2021 22:16:11 - INFO - __main__ - Step 7293: {'lr': 0.0004984243154989168, 'samples': 1400256, 'steps': 7292, 'loss/train': 1.5568764209747314}} +11/06/2021 22:16:12 - INFO - __main__ - Step 7297: {'lr': 0.0004984219351216116, 'samples': 1401024, 'steps': 7296, 'loss/train': 2.4018189907073975}} +11/06/2021 22:16:14 - INFO - __main__ - Step 7301: {'lr': 0.0004984195529533451, 'samples': 1401792, 'steps': 7300, 'loss/train': 1.912482500076294}}} +11/06/2021 22:16:17 - INFO - __main__ - Step 7306: {'lr': 0.0004984165727244984, 'samples': 1402752, 'steps': 7305, 'loss/train': 1.6583056449890137}} +11/06/2021 22:16:19 - INFO - __main__ - Step 7310: {'lr': 0.0004984141865266312, 'samples': 1403520, 'steps': 7309, 'loss/train': 0.43410855531692505} +11/06/2021 22:16:21 - INFO - __main__ - Step 7314: {'lr': 0.0004984117985378586, 'samples': 1404288, 'steps': 7313, 'loss/train': 2.5833494663238525}} +11/06/2021 22:16:22 - INFO - __main__ - Step 7318: {'lr': 0.0004984094087581975, 'samples': 1405056, 'steps': 7317, 'loss/train': 1.7780122756958008}} +11/06/2021 22:16:24 - INFO - __main__ - Step 7322: {'lr': 0.0004984070171876653, 'samples': 1405824, 'steps': 7321, 'loss/train': 2.0687177181243896}} +11/06/2021 22:16:27 - INFO - __main__ - Step 7327: {'lr': 0.0004984040252061137, 'samples': 1406784, 'steps': 7326, 'loss/train': 2.036705255508423}}} +11/06/2021 22:16:29 - INFO - __main__ - Step 7331: {'lr': 0.0004984016296061846, 'samples': 1407552, 'steps': 7330, 'loss/train': 1.4878357648849487}} +11/06/2021 22:16:29 - INFO - __main__ - Step 7331: {'lr': 0.0004984016296061846, 'samples': 1407552, 'steps': 7330, 'loss/train': 1.4878357648849487}} +11/06/2021 22:16:32 - INFO - __main__ - Step 7338: {'lr': 0.0004983974329971702, 'samples': 1408896, 'steps': 7337, 'loss/train': 1.8037465810775757}} +11/06/2021 22:16:34 - INFO - __main__ - Step 7343: {'lr': 0.0004983944320615757, 'samples': 1409856, 'steps': 7342, 'loss/train': 2.154550552368164}}} +11/06/2021 22:16:36 - INFO - __main__ - Step 7347: {'lr': 0.00049839202929849, 'samples': 1410624, 'steps': 7346, 'loss/train': 2.132795572280884}4}}} +11/06/2021 22:16:39 - INFO - __main__ - Step 7352: {'lr': 0.0004983890233263986, 'samples': 1411584, 'steps': 7351, 'loss/train': 1.8521647453308105}} +11/06/2021 22:16:41 - INFO - __main__ - Step 7356: {'lr': 0.0004983866165341592, 'samples': 1412352, 'steps': 7355, 'loss/train': 2.184023380279541}}} +11/06/2021 22:16:43 - INFO - __main__ - Step 7360: {'lr': 0.0004983842079512128, 'samples': 1413120, 'steps': 7359, 'loss/train': 1.5754534006118774}} +11/06/2021 22:16:44 - INFO - __main__ - Step 7364: {'lr': 0.0004983817975775771, 'samples': 1413888, 'steps': 7363, 'loss/train': 1.666754126548767}}} +11/06/2021 22:16:47 - INFO - __main__ - Step 7368: {'lr': 0.0004983793854132693, 'samples': 1414656, 'steps': 7367, 'loss/train': 1.803916335105896}}} +11/06/2021 22:16:49 - INFO - __main__ - Step 7373: {'lr': 0.0004983763676897784, 'samples': 1415616, 'steps': 7372, 'loss/train': 1.749665379524231}}} +11/06/2021 22:16:51 - INFO - __main__ - Step 7377: {'lr': 0.000498373951496522, 'samples': 1416384, 'steps': 7376, 'loss/train': 2.2691292762756348}}} +11/06/2021 22:16:53 - INFO - __main__ - Step 7381: {'lr': 0.00049837153351265, 'samples': 1417152, 'steps': 7380, 'loss/train': 1.6483396291732788}}}} +11/06/2021 22:16:54 - INFO - __main__ - Step 7385: {'lr': 0.00049836911373818, 'samples': 1417920, 'steps': 7384, 'loss/train': 1.690798044204712}}}}} +11/06/2021 22:16:56 - INFO - __main__ - Step 7389: {'lr': 0.0004983666921731293, 'samples': 1418688, 'steps': 7388, 'loss/train': 1.6616744995117188}} +11/06/2021 22:16:59 - INFO - __main__ - Step 7394: {'lr': 0.0004983636626988386, 'samples': 1419648, 'steps': 7393, 'loss/train': 2.0506041049957275}} +11/06/2021 22:17:01 - INFO - __main__ - Step 7398: {'lr': 0.0004983612371050453, 'samples': 1420416, 'steps': 7397, 'loss/train': 1.7991613149642944}} +11/06/2021 22:17:03 - INFO - __main__ - Step 7402: {'lr': 0.0004983588097207283, 'samples': 1421184, 'steps': 7401, 'loss/train': 1.678063988685608}}} +11/06/2021 22:17:05 - INFO - __main__ - Step 7406: {'lr': 0.0004983563805459048, 'samples': 1421952, 'steps': 7405, 'loss/train': 1.7848727703094482}} +11/06/2021 22:17:07 - INFO - __main__ - Step 7410: {'lr': 0.0004983539495805925, 'samples': 1422720, 'steps': 7409, 'loss/train': 0.8858946561813354}} +11/06/2021 22:17:09 - INFO - __main__ - Step 7415: {'lr': 0.0004983509083561038, 'samples': 1423680, 'steps': 7414, 'loss/train': 2.069981813430786}}} +11/06/2021 22:17:09 - INFO - __main__ - Step 7415: {'lr': 0.0004983509083561038, 'samples': 1423680, 'steps': 7414, 'loss/train': 2.069981813430786}}} +11/06/2021 22:17:13 - INFO - __main__ - Step 7422: {'lr': 0.0004983466459418978, 'samples': 1425024, 'steps': 7421, 'loss/train': 2.4349045753479004}} +11/06/2021 22:17:14 - INFO - __main__ - Step 7426: {'lr': 0.0004983442078148056, 'samples': 1425792, 'steps': 7425, 'loss/train': 1.7043726444244385}} +11/06/2021 22:17:16 - INFO - __main__ - Step 7430: {'lr': 0.0004983417678973123, 'samples': 1426560, 'steps': 7429, 'loss/train': 2.2200920581817627}} +11/06/2021 22:17:19 - INFO - __main__ - Step 7435: {'lr': 0.0004983387154827208, 'samples': 1427520, 'steps': 7434, 'loss/train': 1.69056236743927}7}} +11/06/2021 22:17:19 - INFO - __main__ - Step 7435: {'lr': 0.0004983387154827208, 'samples': 1427520, 'steps': 7434, 'loss/train': 1.69056236743927}7}} +11/06/2021 22:17:23 - INFO - __main__ - Step 7443: {'lr': 0.0004983338258007139, 'samples': 1429056, 'steps': 7442, 'loss/train': 1.3787864446640015}} +11/06/2021 22:17:25 - INFO - __main__ - Step 7447: {'lr': 0.0004983313782742124, 'samples': 1429824, 'steps': 7446, 'loss/train': 1.3778132200241089}} +11/06/2021 22:17:27 - INFO - __main__ - Step 7451: {'lr': 0.0004983289289574022, 'samples': 1430592, 'steps': 7450, 'loss/train': 1.7557963132858276}} +11/06/2021 22:17:29 - INFO - __main__ - Step 7456: {'lr': 0.0004983258647937949, 'samples': 1431552, 'steps': 7455, 'loss/train': 2.1020658016204834}} +11/06/2021 22:17:29 - INFO - __main__ - Step 7456: {'lr': 0.0004983258647937949, 'samples': 1431552, 'steps': 7455, 'loss/train': 2.1020658016204834}} +11/06/2021 22:17:34 - INFO - __main__ - Step 7464: {'lr': 0.0004983209563136639, 'samples': 1433088, 'steps': 7463, 'loss/train': 1.939214825630188}}} +11/06/2021 22:17:35 - INFO - __main__ - Step 7468: {'lr': 0.0004983184993882394, 'samples': 1433856, 'steps': 7467, 'loss/train': 1.6667938232421875}} +11/06/2021 22:17:37 - INFO - __main__ - Step 7472: {'lr': 0.000498316040672599, 'samples': 1434624, 'steps': 7471, 'loss/train': 1.767512559890747}5}} +11/06/2021 22:17:39 - INFO - __main__ - Step 7476: {'lr': 0.0004983135801667608, 'samples': 1435392, 'steps': 7475, 'loss/train': 2.2196826934814453}} +11/06/2021 22:17:41 - INFO - __main__ - Step 7480: {'lr': 0.0004983111178707422, 'samples': 1436160, 'steps': 7479, 'loss/train': 1.5433342456817627}} +11/06/2021 22:17:43 - INFO - __main__ - Step 7484: {'lr': 0.0004983086537845611, 'samples': 1436928, 'steps': 7483, 'loss/train': 1.9418973922729492}} +11/06/2021 22:17:45 - INFO - __main__ - Step 7488: {'lr': 0.0004983061879082352, 'samples': 1437696, 'steps': 7487, 'loss/train': 2.341383218765259}}} +11/06/2021 22:17:47 - INFO - __main__ - Step 7492: {'lr': 0.0004983037202417824, 'samples': 1438464, 'steps': 7491, 'loss/train': 1.6653988361358643}} +11/06/2021 22:17:49 - INFO - __main__ - Step 7497: {'lr': 0.0004983006331413773, 'samples': 1439424, 'steps': 7496, 'loss/train': 1.6898235082626343}} +11/06/2021 22:17:51 - INFO - __main__ - Step 7501: {'lr': 0.0004982981614472039, 'samples': 1440192, 'steps': 7500, 'loss/train': 2.0123913288116455}} +11/06/2021 22:17:54 - INFO - __main__ - Step 7505: {'lr': 0.0004982956879629612, 'samples': 1440960, 'steps': 7504, 'loss/train': 2.184455633163452}}} +11/06/2021 22:17:55 - INFO - __main__ - Step 7509: {'lr': 0.0004982932126886674, 'samples': 1441728, 'steps': 7508, 'loss/train': 1.670443058013916}}} +11/06/2021 22:17:57 - INFO - __main__ - Step 7513: {'lr': 0.00049829073562434, 'samples': 1442496, 'steps': 7512, 'loss/train': 1.9669575691223145}}}} +11/06/2021 22:17:59 - INFO - __main__ - Step 7518: {'lr': 0.0004982876367767234, 'samples': 1443456, 'steps': 7517, 'loss/train': 2.108997106552124}}} +11/06/2021 22:18:01 - INFO - __main__ - Step 7522: {'lr': 0.0004982851556848861, 'samples': 1444224, 'steps': 7521, 'loss/train': 1.771378993988037}}} +11/06/2021 22:18:04 - INFO - __main__ - Step 7526: {'lr': 0.0004982826728030735, 'samples': 1444992, 'steps': 7525, 'loss/train': 1.9992296695709229}} +11/06/2021 22:18:05 - INFO - __main__ - Step 7530: {'lr': 0.0004982801881313034, 'samples': 1445760, 'steps': 7529, 'loss/train': 1.9027869701385498}} +11/06/2021 22:18:07 - INFO - __main__ - Step 7534: {'lr': 0.0004982777016695937, 'samples': 1446528, 'steps': 7533, 'loss/train': 1.1510889530181885}} +11/06/2021 22:18:07 - INFO - __main__ - Step 7534: {'lr': 0.0004982777016695937, 'samples': 1446528, 'steps': 7533, 'loss/train': 1.1510889530181885}} +11/06/2021 22:18:11 - INFO - __main__ - Step 7542: {'lr': 0.0004982727233764276, 'samples': 1448064, 'steps': 7541, 'loss/train': 1.264660120010376}}} +11/06/2021 22:18:13 - INFO - __main__ - Step 7546: {'lr': 0.0004982702315450068, 'samples': 1448832, 'steps': 7545, 'loss/train': 2.1761927604675293}} +11/06/2021 22:18:15 - INFO - __main__ - Step 7550: {'lr': 0.0004982677379237185, 'samples': 1449600, 'steps': 7549, 'loss/train': 1.834945797920227}}} +11/06/2021 22:18:18 - INFO - __main__ - Step 7555: {'lr': 0.0004982646183801337, 'samples': 1450560, 'steps': 7554, 'loss/train': 2.560479164123535}}} +11/06/2021 22:18:20 - INFO - __main__ - Step 7559: {'lr': 0.0004982621207317086, 'samples': 1451328, 'steps': 7558, 'loss/train': 1.7856800556182861}} +11/06/2021 22:18:20 - INFO - __main__ - Step 7559: {'lr': 0.0004982621207317086, 'samples': 1451328, 'steps': 7558, 'loss/train': 1.7856800556182861}} +11/06/2021 22:18:23 - INFO - __main__ - Step 7566: {'lr': 0.0004982577455402467, 'samples': 1452672, 'steps': 7565, 'loss/train': 1.7357767820358276}} +11/06/2021 22:18:25 - INFO - __main__ - Step 7571: {'lr': 0.0004982546170476494, 'samples': 1453632, 'steps': 7570, 'loss/train': 1.5686355829238892}} +11/06/2021 22:18:28 - INFO - __main__ - Step 7576: {'lr': 0.0004982514857585596, 'samples': 1454592, 'steps': 7575, 'loss/train': 1.8690491914749146}} +11/06/2021 22:18:28 - INFO - __main__ - Step 7576: {'lr': 0.0004982514857585596, 'samples': 1454592, 'steps': 7575, 'loss/train': 1.8690491914749146}} +11/06/2021 22:18:31 - INFO - __main__ - Step 7583: {'lr': 0.0004982470972557936, 'samples': 1455936, 'steps': 7582, 'loss/train': 2.4827017784118652}} +11/06/2021 22:18:33 - INFO - __main__ - Step 7587: {'lr': 0.0004982445870790823, 'samples': 1456704, 'steps': 7586, 'loss/train': 1.7887145280838013}} +11/06/2021 22:18:35 - INFO - __main__ - Step 7591: {'lr': 0.0004982420751126882, 'samples': 1457472, 'steps': 7590, 'loss/train': 2.2515952587127686}} +11/06/2021 22:18:38 - INFO - __main__ - Step 7596: {'lr': 0.0004982389326379814, 'samples': 1458432, 'steps': 7595, 'loss/train': 1.887166142463684}}} +11/06/2021 22:18:40 - INFO - __main__ - Step 7600: {'lr': 0.0004982364166448669, 'samples': 1459200, 'steps': 7599, 'loss/train': 1.9225597381591797}} +11/06/2021 22:18:41 - INFO - __main__ - Step 7604: {'lr': 0.0004982338988621284, 'samples': 1459968, 'steps': 7603, 'loss/train': 1.420168161392212}}} +11/06/2021 22:18:43 - INFO - __main__ - Step 7608: {'lr': 0.0004982313792897843, 'samples': 1460736, 'steps': 7607, 'loss/train': 1.2424761056900024}} +11/06/2021 22:18:46 - INFO - __main__ - Step 7613: {'lr': 0.0004982282273077483, 'samples': 1461696, 'steps': 7612, 'loss/train': 1.8897991180419922}} +11/06/2021 22:18:48 - INFO - __main__ - Step 7617: {'lr': 0.0004982257037088574, 'samples': 1462464, 'steps': 7616, 'loss/train': 1.82854425907135}2}} +11/06/2021 22:18:50 - INFO - __main__ - Step 7621: {'lr': 0.0004982231783204196, 'samples': 1463232, 'steps': 7620, 'loss/train': 1.768385887145996}}} +11/06/2021 22:18:51 - INFO - __main__ - Step 7625: {'lr': 0.0004982206511424534, 'samples': 1464000, 'steps': 7624, 'loss/train': 1.2371141910552979}} +11/06/2021 22:18:53 - INFO - __main__ - Step 7629: {'lr': 0.0004982181221749769, 'samples': 1464768, 'steps': 7628, 'loss/train': 2.405860424041748}}} +11/06/2021 22:18:56 - INFO - __main__ - Step 7634: {'lr': 0.0004982149584491601, 'samples': 1465728, 'steps': 7633, 'loss/train': 2.227440357208252}}} +11/06/2021 22:18:58 - INFO - __main__ - Step 7638: {'lr': 0.000498212425455352, 'samples': 1466496, 'steps': 7637, 'loss/train': 1.6778465509414673}}} +11/06/2021 22:19:00 - INFO - __main__ - Step 7642: {'lr': 0.0004982098906720928, 'samples': 1467264, 'steps': 7641, 'loss/train': 1.8286490440368652}} +11/06/2021 22:19:00 - INFO - __main__ - Step 7642: {'lr': 0.0004982098906720928, 'samples': 1467264, 'steps': 7641, 'loss/train': 1.8286490440368652}} +11/06/2021 22:19:03 - INFO - __main__ - Step 7649: {'lr': 0.0004982054504955778, 'samples': 1468608, 'steps': 7648, 'loss/train': 1.6242306232452393}} +11/06/2021 22:19:06 - INFO - __main__ - Step 7655: {'lr': 0.0004982016402683255, 'samples': 1469760, 'steps': 7654, 'loss/train': 2.361668348312378}}} +11/06/2021 22:19:08 - INFO - __main__ - Step 7659: {'lr': 0.0004981990978801035, 'samples': 1470528, 'steps': 7658, 'loss/train': 2.046013593673706}}} +11/06/2021 22:19:10 - INFO - __main__ - Step 7663: {'lr': 0.0004981965537025267, 'samples': 1471296, 'steps': 7662, 'loss/train': 2.0140273571014404}} +11/06/2021 22:19:10 - INFO - __main__ - Step 7663: {'lr': 0.0004981965537025267, 'samples': 1471296, 'steps': 7662, 'loss/train': 2.0140273571014404}} +11/06/2021 22:19:13 - INFO - __main__ - Step 7670: {'lr': 0.000498192097086187, 'samples': 1472640, 'steps': 7669, 'loss/train': 1.8466298580169678}}} +11/06/2021 22:19:15 - INFO - __main__ - Step 7675: {'lr': 0.0004981889104338499, 'samples': 1473600, 'steps': 7674, 'loss/train': 1.673049807548523}}} +11/06/2021 22:19:18 - INFO - __main__ - Step 7680: {'lr': 0.0004981857209857605, 'samples': 1474560, 'steps': 7679, 'loss/train': 2.1773593425750732}} +11/06/2021 22:19:18 - INFO - __main__ - Step 7680: {'lr': 0.0004981857209857605, 'samples': 1474560, 'steps': 7679, 'loss/train': 2.1773593425750732}} +11/06/2021 22:19:21 - INFO - __main__ - Step 7687: {'lr': 0.0004981812510616399, 'samples': 1475904, 'steps': 7686, 'loss/train': 1.9942034482955933}} +11/06/2021 22:19:23 - INFO - __main__ - Step 7691: {'lr': 0.0004981786943590928, 'samples': 1476672, 'steps': 7690, 'loss/train': 1.96816885471344}3}} +11/06/2021 22:19:26 - INFO - __main__ - Step 7696: {'lr': 0.0004981754959648376, 'samples': 1477632, 'steps': 7695, 'loss/train': 1.89278244972229}3}} +11/06/2021 22:19:26 - INFO - __main__ - Step 7696: {'lr': 0.0004981754959648376, 'samples': 1477632, 'steps': 7695, 'loss/train': 1.89278244972229}3}} +11/06/2021 22:19:30 - INFO - __main__ - Step 7704: {'lr': 0.0004981703727191935, 'samples': 1479168, 'steps': 7703, 'loss/train': 1.7264535427093506}} +11/06/2021 22:19:31 - INFO - __main__ - Step 7708: {'lr': 0.0004981678084126405, 'samples': 1479936, 'steps': 7707, 'loss/train': 1.5540006160736084}} +11/06/2021 22:19:33 - INFO - __main__ - Step 7712: {'lr': 0.0004981652423169582, 'samples': 1480704, 'steps': 7711, 'loss/train': 1.3098105192184448}} +11/06/2021 22:19:36 - INFO - __main__ - Step 7717: {'lr': 0.0004981620321814203, 'samples': 1481664, 'steps': 7716, 'loss/train': 1.9144853353500366}} +11/06/2021 22:19:38 - INFO - __main__ - Step 7722: {'lr': 0.0004981588192504329, 'samples': 1482624, 'steps': 7721, 'loss/train': 0.8639780879020691}} +11/06/2021 22:19:38 - INFO - __main__ - Step 7722: {'lr': 0.0004981588192504329, 'samples': 1482624, 'steps': 7721, 'loss/train': 0.8639780879020691}} +11/06/2021 22:19:38 - INFO - __main__ - Step 7722: {'lr': 0.0004981588192504329, 'samples': 1482624, 'steps': 7721, 'loss/train': 0.8639780879020691}} +11/06/2021 22:19:43 - INFO - __main__ - Step 7732: {'lr': 0.000498152385002254, 'samples': 1484544, 'steps': 7731, 'loss/train': 2.0949268341064453}}} +11/06/2021 22:19:46 - INFO - __main__ - Step 7738: {'lr': 0.0004981485190862737, 'samples': 1485696, 'steps': 7737, 'loss/train': 1.6075444221496582}} +11/06/2021 22:19:48 - INFO - __main__ - Step 7742: {'lr': 0.0004981459395727117, 'samples': 1486464, 'steps': 7741, 'loss/train': 2.1248600482940674}} +11/06/2021 22:19:48 - INFO - __main__ - Step 7742: {'lr': 0.0004981459395727117, 'samples': 1486464, 'steps': 7741, 'loss/train': 2.1248600482940674}} +11/06/2021 22:19:51 - INFO - __main__ - Step 7749: {'lr': 0.0004981414211192763, 'samples': 1487808, 'steps': 7748, 'loss/train': 2.3146755695343018}} +11/06/2021 22:19:53 - INFO - __main__ - Step 7753: {'lr': 0.0004981388366860869, 'samples': 1488576, 'steps': 7752, 'loss/train': 1.484642744064331}}} +11/06/2021 22:19:56 - INFO - __main__ - Step 7759: {'lr': 0.0004981349566820828, 'samples': 1489728, 'steps': 7758, 'loss/train': 1.9951647520065308}} +11/06/2021 22:19:58 - INFO - __main__ - Step 7763: {'lr': 0.0004981323677766273, 'samples': 1490496, 'steps': 7762, 'loss/train': 2.313772678375244}}} +11/06/2021 22:20:00 - INFO - __main__ - Step 7767: {'lr': 0.0004981297770822977, 'samples': 1491264, 'steps': 7766, 'loss/train': 2.1629531383514404}} +11/06/2021 22:20:00 - INFO - __main__ - Step 7767: {'lr': 0.0004981297770822977, 'samples': 1491264, 'steps': 7766, 'loss/train': 2.1629531383514404}} +11/06/2021 22:20:03 - INFO - __main__ - Step 7774: {'lr': 0.0004981252390627997, 'samples': 1492608, 'steps': 7773, 'loss/train': 2.382383108139038}}} +11/06/2021 22:20:06 - INFO - __main__ - Step 7779: {'lr': 0.000498121994266253, 'samples': 1493568, 'steps': 7778, 'loss/train': 1.9787876605987549}}} +11/06/2021 22:20:08 - INFO - __main__ - Step 7783: {'lr': 0.0004981193964166151, 'samples': 1494336, 'steps': 7782, 'loss/train': 2.476020097732544}}} +11/06/2021 22:20:10 - INFO - __main__ - Step 7787: {'lr': 0.0004981167967781968, 'samples': 1495104, 'steps': 7786, 'loss/train': 1.5972424745559692}} +11/06/2021 22:20:12 - INFO - __main__ - Step 7791: {'lr': 0.0004981141953510169, 'samples': 1495872, 'steps': 7790, 'loss/train': 1.9454317092895508}} +11/06/2021 22:20:14 - INFO - __main__ - Step 7795: {'lr': 0.0004981115921350941, 'samples': 1496640, 'steps': 7794, 'loss/train': 1.3753095865249634}} +11/06/2021 22:20:16 - INFO - __main__ - Step 7800: {'lr': 0.0004981083355997995, 'samples': 1497600, 'steps': 7799, 'loss/train': 2.574296236038208}}} +11/06/2021 22:20:16 - INFO - __main__ - Step 7800: {'lr': 0.0004981083355997995, 'samples': 1497600, 'steps': 7799, 'loss/train': 2.574296236038208}}} +11/06/2021 22:20:20 - INFO - __main__ - Step 7808: {'lr': 0.0004981031193300667, 'samples': 1499136, 'steps': 7807, 'loss/train': 1.0529712438583374}} +11/06/2021 22:20:22 - INFO - __main__ - Step 7812: {'lr': 0.0004981005085121963, 'samples': 1499904, 'steps': 7811, 'loss/train': 2.1915555000305176}} +11/06/2021 22:20:24 - INFO - __main__ - Step 7816: {'lr': 0.0004980978959056819, 'samples': 1500672, 'steps': 7815, 'loss/train': 2.804755926132202}}} +11/06/2021 22:20:24 - INFO - __main__ - Step 7816: {'lr': 0.0004980978959056819, 'samples': 1500672, 'steps': 7815, 'loss/train': 2.804755926132202}}} +11/06/2021 22:20:24 - INFO - __main__ - Step 7816: {'lr': 0.0004980978959056819, 'samples': 1500672, 'steps': 7815, 'loss/train': 2.804755926132202}}} +11/06/2021 22:20:30 - INFO - __main__ - Step 7827: {'lr': 0.0004980907020152242, 'samples': 1502784, 'steps': 7826, 'loss/train': 2.0572545528411865}} +11/06/2021 22:20:32 - INFO - __main__ - Step 7832: {'lr': 0.0004980874275935591, 'samples': 1503744, 'steps': 7831, 'loss/train': 0.8481667041778564}} +11/06/2021 22:20:35 - INFO - __main__ - Step 7837: {'lr': 0.0004980841503772846, 'samples': 1504704, 'steps': 7836, 'loss/train': 1.764209270477295}}} +11/06/2021 22:20:35 - INFO - __main__ - Step 7837: {'lr': 0.0004980841503772846, 'samples': 1504704, 'steps': 7836, 'loss/train': 1.764209270477295}}} +11/06/2021 22:20:38 - INFO - __main__ - Step 7843: {'lr': 0.0004980802140289232, 'samples': 1505856, 'steps': 7842, 'loss/train': 1.2913402318954468}} +11/06/2021 22:20:40 - INFO - __main__ - Step 7847: {'lr': 0.000498077587561056, 'samples': 1506624, 'steps': 7846, 'loss/train': 1.6562167406082153}}} +11/06/2021 22:20:40 - INFO - __main__ - Step 7847: {'lr': 0.000498077587561056, 'samples': 1506624, 'steps': 7846, 'loss/train': 1.6562167406082153}}} +11/06/2021 22:20:43 - INFO - __main__ - Step 7854: {'lr': 0.0004980729869387724, 'samples': 1507968, 'steps': 7853, 'loss/train': 1.2803887128829956}} +11/06/2021 22:20:45 - INFO - __main__ - Step 7858: {'lr': 0.0004980703555526338, 'samples': 1508736, 'steps': 7857, 'loss/train': 1.8307812213897705}} +11/06/2021 22:20:48 - INFO - __main__ - Step 7863: {'lr': 0.0004980670638049875, 'samples': 1509696, 'steps': 7862, 'loss/train': 2.1986732482910156}} +11/06/2021 22:20:50 - INFO - __main__ - Step 7867: {'lr': 0.0004980644283949152, 'samples': 1510464, 'steps': 7866, 'loss/train': 1.8365942239761353}} +11/06/2021 22:20:50 - INFO - __main__ - Step 7867: {'lr': 0.0004980644283949152, 'samples': 1510464, 'steps': 7866, 'loss/train': 1.8365942239761353}} +11/06/2021 22:20:53 - INFO - __main__ - Step 7873: {'lr': 0.0004980604719265928, 'samples': 1511616, 'steps': 7872, 'loss/train': 1.9281331300735474}} +11/06/2021 22:20:56 - INFO - __main__ - Step 7879: {'lr': 0.0004980565114344704, 'samples': 1512768, 'steps': 7878, 'loss/train': 2.003199577331543}}} +11/06/2021 22:20:58 - INFO - __main__ - Step 7883: {'lr': 0.0004980538688709761, 'samples': 1513536, 'steps': 7882, 'loss/train': 1.9707108736038208}} +11/06/2021 22:21:00 - INFO - __main__ - Step 7887: {'lr': 0.0004980512245191738, 'samples': 1514304, 'steps': 7886, 'loss/train': 2.2796289920806885}} +11/06/2021 22:21:02 - INFO - __main__ - Step 7891: {'lr': 0.0004980485783790827, 'samples': 1515072, 'steps': 7890, 'loss/train': 1.8750466108322144}} +11/06/2021 22:21:04 - INFO - __main__ - Step 7895: {'lr': 0.0004980459304507218, 'samples': 1515840, 'steps': 7894, 'loss/train': 2.0702314376831055}} +11/06/2021 22:21:06 - INFO - __main__ - Step 7899: {'lr': 0.0004980432807341102, 'samples': 1516608, 'steps': 7898, 'loss/train': 1.881008267402649}}} +11/06/2021 22:21:06 - INFO - __main__ - Step 7899: {'lr': 0.0004980432807341102, 'samples': 1516608, 'steps': 7898, 'loss/train': 1.881008267402649}}} +11/06/2021 22:21:10 - INFO - __main__ - Step 7906: {'lr': 0.0004980386394271191, 'samples': 1517952, 'steps': 7905, 'loss/train': 1.9592478275299072}} +11/06/2021 22:21:12 - INFO - __main__ - Step 7911: {'lr': 0.0004980353208549623, 'samples': 1518912, 'steps': 7910, 'loss/train': 2.016561508178711}}} +11/06/2021 22:21:12 - INFO - __main__ - Step 7911: {'lr': 0.0004980353208549623, 'samples': 1518912, 'steps': 7910, 'loss/train': 2.016561508178711}}} +11/06/2021 22:21:12 - INFO - __main__ - Step 7911: {'lr': 0.0004980353208549623, 'samples': 1518912, 'steps': 7910, 'loss/train': 2.016561508178711}}} +11/06/2021 22:21:18 - INFO - __main__ - Step 7922: {'lr': 0.0004980280101613119, 'samples': 1521024, 'steps': 7921, 'loss/train': 2.067695379257202}}} +11/06/2021 22:21:20 - INFO - __main__ - Step 7927: {'lr': 0.0004980246826484157, 'samples': 1521984, 'steps': 7926, 'loss/train': 1.8057146072387695}} +11/06/2021 22:21:20 - INFO - __main__ - Step 7927: {'lr': 0.0004980246826484157, 'samples': 1521984, 'steps': 7926, 'loss/train': 1.8057146072387695}} +11/06/2021 22:21:24 - INFO - __main__ - Step 7934: {'lr': 0.0004980200194366136, 'samples': 1523328, 'steps': 7933, 'loss/train': 1.6870510578155518}} +11/06/2021 22:21:26 - INFO - __main__ - Step 7938: {'lr': 0.0004980173522855608, 'samples': 1524096, 'steps': 7937, 'loss/train': 1.793459415435791}}} +11/06/2021 22:21:28 - INFO - __main__ - Step 7943: {'lr': 0.0004980140158323092, 'samples': 1525056, 'steps': 7942, 'loss/train': 1.4568382501602173}} +11/06/2021 22:21:28 - INFO - __main__ - Step 7943: {'lr': 0.0004980140158323092, 'samples': 1525056, 'steps': 7942, 'loss/train': 1.4568382501602173}} +11/06/2021 22:21:32 - INFO - __main__ - Step 7951: {'lr': 0.0004980086716960552, 'samples': 1526592, 'steps': 7950, 'loss/train': 2.027440071105957}}} +11/06/2021 22:21:34 - INFO - __main__ - Step 7955: {'lr': 0.0004980059969459455, 'samples': 1527360, 'steps': 7954, 'loss/train': 1.7081891298294067}} +11/06/2021 22:21:36 - INFO - __main__ - Step 7959: {'lr': 0.000498003320407873, 'samples': 1528128, 'steps': 7958, 'loss/train': 2.172380208969116}7}} +11/06/2021 22:21:38 - INFO - __main__ - Step 7964: {'lr': 0.0004979999722209891, 'samples': 1529088, 'steps': 7963, 'loss/train': 1.9147931337356567}} +11/06/2021 22:21:38 - INFO - __main__ - Step 7964: {'lr': 0.0004979999722209891, 'samples': 1529088, 'steps': 7963, 'loss/train': 1.9147931337356567}} +11/06/2021 22:21:38 - INFO - __main__ - Step 7964: {'lr': 0.0004979999722209891, 'samples': 1529088, 'steps': 7963, 'loss/train': 1.9147931337356567}} +11/06/2021 22:21:44 - INFO - __main__ - Step 7975: {'lr': 0.000497992596376341, 'samples': 1531200, 'steps': 7974, 'loss/train': 1.6081430912017822}}} +11/06/2021 22:21:47 - INFO - __main__ - Step 7980: {'lr': 0.0004979892392499932, 'samples': 1532160, 'steps': 7979, 'loss/train': 1.864031434059143}}} +11/06/2021 22:21:47 - INFO - __main__ - Step 7980: {'lr': 0.0004979892392499932, 'samples': 1532160, 'steps': 7979, 'loss/train': 1.864031434059143}}} +11/06/2021 22:21:50 - INFO - __main__ - Step 7987: {'lr': 0.0004979845345800294, 'samples': 1533504, 'steps': 7986, 'loss/train': 1.5527995824813843}} +11/06/2021 22:21:52 - INFO - __main__ - Step 7991: {'lr': 0.0004979818437389502, 'samples': 1534272, 'steps': 7990, 'loss/train': 1.586555004119873}}} +11/06/2021 22:21:55 - INFO - __main__ - Step 7996: {'lr': 0.0004979784776735257, 'samples': 1535232, 'steps': 7995, 'loss/train': 2.107032060623169}}} +11/06/2021 22:21:55 - INFO - __main__ - Step 7996: {'lr': 0.0004979784776735257, 'samples': 1535232, 'steps': 7995, 'loss/train': 2.107032060623169}}} +11/06/2021 22:21:58 - INFO - __main__ - Step 8003: {'lr': 0.0004979737604890582, 'samples': 1536576, 'steps': 8002, 'loss/train': 2.0916402339935303}} +11/06/2021 22:22:01 - INFO - __main__ - Step 8007: {'lr': 0.0004979710624969408, 'samples': 1537344, 'steps': 8006, 'loss/train': 1.6920371055603027}} +11/06/2021 22:22:02 - INFO - __main__ - Step 8011: {'lr': 0.0004979683627171125, 'samples': 1538112, 'steps': 8010, 'loss/train': 2.038038730621338}}} +11/06/2021 22:22:04 - INFO - __main__ - Step 8015: {'lr': 0.0004979656611495927, 'samples': 1538880, 'steps': 8014, 'loss/train': 2.2237470149993896}} +11/06/2021 22:22:07 - INFO - __main__ - Step 8020: {'lr': 0.0004979622816762815, 'samples': 1539840, 'steps': 8019, 'loss/train': 2.0212595462799072}} +11/06/2021 22:22:09 - INFO - __main__ - Step 8024: {'lr': 0.0004979595760865271, 'samples': 1540608, 'steps': 8023, 'loss/train': 1.602588176727295}}} +11/06/2021 22:22:09 - INFO - __main__ - Step 8024: {'lr': 0.0004979595760865271, 'samples': 1540608, 'steps': 8023, 'loss/train': 1.602588176727295}}} +11/06/2021 22:22:12 - INFO - __main__ - Step 8031: {'lr': 0.0004979548370029884, 'samples': 1541952, 'steps': 8030, 'loss/train': 1.7080976963043213}} +11/06/2021 22:22:14 - INFO - __main__ - Step 8036: {'lr': 0.0004979514485915731, 'samples': 1542912, 'steps': 8035, 'loss/train': 1.4310439825057983}} +11/06/2021 22:22:17 - INFO - __main__ - Step 8041: {'lr': 0.0004979480573870803, 'samples': 1543872, 'steps': 8040, 'loss/train': 1.2592707872390747}} +11/06/2021 22:22:19 - INFO - __main__ - Step 8045: {'lr': 0.0004979453424124961, 'samples': 1544640, 'steps': 8044, 'loss/train': 1.2424389123916626}} +11/06/2021 22:22:21 - INFO - __main__ - Step 8049: {'lr': 0.0004979426256503863, 'samples': 1545408, 'steps': 8048, 'loss/train': 2.2753522396087646}} +11/06/2021 22:22:21 - INFO - __main__ - Step 8049: {'lr': 0.0004979426256503863, 'samples': 1545408, 'steps': 8048, 'loss/train': 2.2753522396087646}} +11/06/2021 22:22:24 - INFO - __main__ - Step 8056: {'lr': 0.00049793786701552, 'samples': 1546752, 'steps': 8055, 'loss/train': 1.7011387348175049}6}} +11/06/2021 22:22:24 - INFO - __main__ - Step 8056: {'lr': 0.00049793786701552, 'samples': 1546752, 'steps': 8055, 'loss/train': 1.7011387348175049}6}} +11/06/2021 22:22:24 - INFO - __main__ - Step 8056: {'lr': 0.00049793786701552, 'samples': 1546752, 'steps': 8055, 'loss/train': 1.7011387348175049}6}} +11/06/2021 22:22:30 - INFO - __main__ - Step 8068: {'lr': 0.0004979296966200718, 'samples': 1549056, 'steps': 8067, 'loss/train': 1.7086400985717773}} +11/06/2021 22:22:32 - INFO - __main__ - Step 8073: {'lr': 0.0004979262875407896, 'samples': 1550016, 'steps': 8072, 'loss/train': 1.3283685445785522}} +11/06/2021 22:22:32 - INFO - __main__ - Step 8073: {'lr': 0.0004979262875407896, 'samples': 1550016, 'steps': 8072, 'loss/train': 1.3283685445785522}} +11/06/2021 22:22:36 - INFO - __main__ - Step 8079: {'lr': 0.0004979221929591663, 'samples': 1551168, 'steps': 8078, 'loss/train': 2.025535821914673}}} +11/06/2021 22:22:39 - INFO - __main__ - Step 8085: {'lr': 0.000497918094355986, 'samples': 1552320, 'steps': 8084, 'loss/train': 1.904146671295166}}}} +11/06/2021 22:22:41 - INFO - __main__ - Step 8089: {'lr': 0.0004979153597197003, 'samples': 1553088, 'steps': 8088, 'loss/train': 1.035143256187439}}} +11/06/2021 22:22:41 - INFO - __main__ - Step 8089: {'lr': 0.0004979153597197003, 'samples': 1553088, 'steps': 8088, 'loss/train': 1.035143256187439}}} +11/06/2021 22:22:44 - INFO - __main__ - Step 8096: {'lr': 0.0004979105698054992, 'samples': 1554432, 'steps': 8095, 'loss/train': 2.0879011154174805}} +11/06/2021 22:22:47 - INFO - __main__ - Step 8101: {'lr': 0.0004979071450870662, 'samples': 1555392, 'steps': 8100, 'loss/train': 1.7830842733383179}} +11/06/2021 22:22:49 - INFO - __main__ - Step 8106: {'lr': 0.0004979037175760548, 'samples': 1556352, 'steps': 8105, 'loss/train': 2.045214891433716}}} +11/06/2021 22:22:49 - INFO - __main__ - Step 8106: {'lr': 0.0004979037175760548, 'samples': 1556352, 'steps': 8105, 'loss/train': 2.045214891433716}}} +11/06/2021 22:22:49 - INFO - __main__ - Step 8106: {'lr': 0.0004979037175760548, 'samples': 1556352, 'steps': 8105, 'loss/train': 2.045214891433716}}} +11/06/2021 22:22:54 - INFO - __main__ - Step 8116: {'lr': 0.0004978968541764515, 'samples': 1558272, 'steps': 8115, 'loss/train': 2.9898436069488525}} +11/06/2021 22:22:57 - INFO - __main__ - Step 8121: {'lr': 0.0004978934182879369, 'samples': 1559232, 'steps': 8120, 'loss/train': 1.8195523023605347}} +11/06/2021 22:22:59 - INFO - __main__ - Step 8125: {'lr': 0.0004978906675665782, 'samples': 1560000, 'steps': 8124, 'loss/train': 2.085545063018799}}} +11/06/2021 22:23:00 - INFO - __main__ - Step 8129: {'lr': 0.0004978879150580882, 'samples': 1560768, 'steps': 8128, 'loss/train': 1.8509951829910278}} +11/06/2021 22:23:00 - INFO - __main__ - Step 8129: {'lr': 0.0004978879150580882, 'samples': 1560768, 'steps': 8128, 'loss/train': 1.8509951829910278}} +11/06/2021 22:23:05 - INFO - __main__ - Step 8137: {'lr': 0.0004978824046797935, 'samples': 1562304, 'steps': 8136, 'loss/train': 2.647218942642212}}} +11/06/2021 22:23:06 - INFO - __main__ - Step 8141: {'lr': 0.0004978796468100286, 'samples': 1563072, 'steps': 8140, 'loss/train': 1.7271705865859985}} +11/06/2021 22:23:09 - INFO - __main__ - Step 8146: {'lr': 0.0004978761969597831, 'samples': 1564032, 'steps': 8145, 'loss/train': 2.357698917388916}}} +11/06/2021 22:23:11 - INFO - __main__ - Step 8150: {'lr': 0.0004978734350691793, 'samples': 1564800, 'steps': 8149, 'loss/train': 1.4162994623184204}} +11/06/2021 22:23:13 - INFO - __main__ - Step 8154: {'lr': 0.0004978706713915684, 'samples': 1565568, 'steps': 8153, 'loss/train': 1.7779927253723145}} +11/06/2021 22:23:13 - INFO - __main__ - Step 8154: {'lr': 0.0004978706713915684, 'samples': 1565568, 'steps': 8153, 'loss/train': 1.7779927253723145}} +11/06/2021 22:23:16 - INFO - __main__ - Step 8161: {'lr': 0.0004978658306558234, 'samples': 1566912, 'steps': 8160, 'loss/train': 1.9604636430740356}} +11/06/2021 22:23:19 - INFO - __main__ - Step 8166: {'lr': 0.0004978623696368924, 'samples': 1567872, 'steps': 8165, 'loss/train': 1.8691977262496948}} +11/06/2021 22:23:19 - INFO - __main__ - Step 8166: {'lr': 0.0004978623696368924, 'samples': 1567872, 'steps': 8165, 'loss/train': 1.8691977262496948}} +11/06/2021 22:23:23 - INFO - __main__ - Step 8174: {'lr': 0.0004978568261991051, 'samples': 1569408, 'steps': 8173, 'loss/train': 1.6820038557052612}} +11/06/2021 22:23:24 - INFO - __main__ - Step 8178: {'lr': 0.0004978540517998704, 'samples': 1570176, 'steps': 8177, 'loss/train': 1.511248230934143}}} +11/06/2021 22:23:26 - INFO - __main__ - Step 8182: {'lr': 0.0004978512756137684, 'samples': 1570944, 'steps': 8181, 'loss/train': 2.5265679359436035}} +11/06/2021 22:23:29 - INFO - __main__ - Step 8187: {'lr': 0.000497847802868389, 'samples': 1571904, 'steps': 8186, 'loss/train': 1.9279881715774536}}} +11/06/2021 22:23:29 - INFO - __main__ - Step 8187: {'lr': 0.000497847802868389, 'samples': 1571904, 'steps': 8186, 'loss/train': 1.9279881715774536}}} +11/06/2021 22:23:33 - INFO - __main__ - Step 8195: {'lr': 0.0004978422406686257, 'samples': 1573440, 'steps': 8194, 'loss/train': 1.9039665460586548}} +11/06/2021 22:23:35 - INFO - __main__ - Step 8199: {'lr': 0.0004978394568885608, 'samples': 1574208, 'steps': 8198, 'loss/train': 1.7852051258087158}} +11/06/2021 22:23:37 - INFO - __main__ - Step 8203: {'lr': 0.0004978366713217336, 'samples': 1574976, 'steps': 8202, 'loss/train': 1.418635368347168}}} +11/06/2021 22:23:39 - INFO - __main__ - Step 8208: {'lr': 0.000497833186850596, 'samples': 1575936, 'steps': 8207, 'loss/train': 1.9825032949447632}}} +11/06/2021 22:23:41 - INFO - __main__ - Step 8212: {'lr': 0.0004978303972636275, 'samples': 1576704, 'steps': 8211, 'loss/train': 1.6517690420150757}} +11/06/2021 22:23:43 - INFO - __main__ - Step 8216: {'lr': 0.000497827605889962, 'samples': 1577472, 'steps': 8215, 'loss/train': 1.8105554580688477}}} +11/06/2021 22:23:45 - INFO - __main__ - Step 8220: {'lr': 0.0004978248127296198, 'samples': 1578240, 'steps': 8219, 'loss/train': 2.2303905487060547}} +11/06/2021 22:23:47 - INFO - __main__ - Step 8224: {'lr': 0.0004978220177826212, 'samples': 1579008, 'steps': 8223, 'loss/train': 1.977313756942749}}} +11/06/2021 22:23:49 - INFO - __main__ - Step 8229: {'lr': 0.0004978185215864177, 'samples': 1579968, 'steps': 8228, 'loss/train': 1.8177608251571655}} +11/06/2021 22:23:51 - INFO - __main__ - Step 8233: {'lr': 0.0004978157226195153, 'samples': 1580736, 'steps': 8232, 'loss/train': 1.4781603813171387}} +11/06/2021 22:23:53 - INFO - __main__ - Step 8237: {'lr': 0.000497812921866022, 'samples': 1581504, 'steps': 8236, 'loss/train': 2.0580477714538574}}} +11/06/2021 22:23:55 - INFO - __main__ - Step 8241: {'lr': 0.0004978101193259578, 'samples': 1582272, 'steps': 8240, 'loss/train': 0.3795441687107086}} +11/06/2021 22:23:57 - INFO - __main__ - Step 8245: {'lr': 0.000497807314999343, 'samples': 1583040, 'steps': 8244, 'loss/train': 1.9589273929595947}}} +11/06/2021 22:23:59 - INFO - __main__ - Step 8250: {'lr': 0.0004978038070787683, 'samples': 1584000, 'steps': 8249, 'loss/train': 2.009343147277832}}} +11/06/2021 22:24:01 - INFO - __main__ - Step 8254: {'lr': 0.0004978009987324884, 'samples': 1584768, 'steps': 8253, 'loss/train': 1.9142787456512451}} +11/06/2021 22:24:03 - INFO - __main__ - Step 8258: {'lr': 0.0004977981885997235, 'samples': 1585536, 'steps': 8257, 'loss/train': 1.3908742666244507}} +11/06/2021 22:24:05 - INFO - __main__ - Step 8262: {'lr': 0.0004977953766804941, 'samples': 1586304, 'steps': 8261, 'loss/train': 1.7750216722488403}} +11/06/2021 22:24:07 - INFO - __main__ - Step 8266: {'lr': 0.0004977925629748203, 'samples': 1587072, 'steps': 8265, 'loss/train': 1.8348907232284546}} +11/06/2021 22:24:09 - INFO - __main__ - Step 8271: {'lr': 0.0004977890433305716, 'samples': 1588032, 'steps': 8270, 'loss/train': 2.1743407249450684}} +11/06/2021 22:24:12 - INFO - __main__ - Step 8275: {'lr': 0.0004977862256054721, 'samples': 1588800, 'steps': 8274, 'loss/train': 1.8264741897583008}} +11/06/2021 22:24:14 - INFO - __main__ - Step 8279: {'lr': 0.0004977834060939943, 'samples': 1589568, 'steps': 8278, 'loss/train': 1.6243547201156616}} +11/06/2021 22:24:15 - INFO - __main__ - Step 8283: {'lr': 0.0004977805847961584, 'samples': 1590336, 'steps': 8282, 'loss/train': 1.9494577646255493}} +11/06/2021 22:24:17 - INFO - __main__ - Step 8287: {'lr': 0.0004977777617119847, 'samples': 1591104, 'steps': 8286, 'loss/train': 1.8675819635391235}} +11/06/2021 22:24:20 - INFO - __main__ - Step 8292: {'lr': 0.0004977742303447613, 'samples': 1592064, 'steps': 8291, 'loss/train': 2.4035115242004395}} +11/06/2021 22:24:22 - INFO - __main__ - Step 8296: {'lr': 0.0004977714032414021, 'samples': 1592832, 'steps': 8295, 'loss/train': 1.709094762802124}}} +11/06/2021 22:24:22 - INFO - __main__ - Step 8296: {'lr': 0.0004977714032414021, 'samples': 1592832, 'steps': 8295, 'loss/train': 1.709094762802124}}} +11/06/2021 22:24:25 - INFO - __main__ - Step 8303: {'lr': 0.0004977664515123201, 'samples': 1594176, 'steps': 8302, 'loss/train': 1.8622348308563232}} +11/06/2021 22:24:27 - INFO - __main__ - Step 8307: {'lr': 0.0004977636194967634, 'samples': 1594944, 'steps': 8306, 'loss/train': 2.114375591278076}}} +11/06/2021 22:24:29 - INFO - __main__ - Step 8312: {'lr': 0.0004977600769654545, 'samples': 1595904, 'steps': 8311, 'loss/train': 1.5743494033813477}} +11/06/2021 22:24:31 - INFO - __main__ - Step 8316: {'lr': 0.0004977572409309418, 'samples': 1596672, 'steps': 8315, 'loss/train': 1.7749756574630737}} +11/06/2021 22:24:34 - INFO - __main__ - Step 8320: {'lr': 0.0004977544031102597, 'samples': 1597440, 'steps': 8319, 'loss/train': 1.7613978385925293}} +11/06/2021 22:24:35 - INFO - __main__ - Step 8324: {'lr': 0.0004977515635034285, 'samples': 1598208, 'steps': 8323, 'loss/train': 1.7190172672271729}} +11/06/2021 22:24:37 - INFO - __main__ - Step 8328: {'lr': 0.000497748722110469, 'samples': 1598976, 'steps': 8327, 'loss/train': 3.0373826026916504}}} +11/06/2021 22:24:40 - INFO - __main__ - Step 8333: {'lr': 0.0004977451678575575, 'samples': 1599936, 'steps': 8332, 'loss/train': 1.207032561302185}}} +11/06/2021 22:24:40 - INFO - __main__ - Step 8333: {'lr': 0.0004977451678575575, 'samples': 1599936, 'steps': 8332, 'loss/train': 1.207032561302185}}} +11/06/2021 22:24:43 - INFO - __main__ - Step 8340: {'lr': 0.0004977401872150241, 'samples': 1601280, 'steps': 8339, 'loss/train': 1.857647180557251}}} +11/06/2021 22:24:45 - INFO - __main__ - Step 8344: {'lr': 0.0004977373386777554, 'samples': 1602048, 'steps': 8343, 'loss/train': 2.0518319606781006}} +11/06/2021 22:24:47 - INFO - __main__ - Step 8349: {'lr': 0.0004977337754945731, 'samples': 1603008, 'steps': 8348, 'loss/train': 1.9418188333511353}} +11/06/2021 22:24:47 - INFO - __main__ - Step 8349: {'lr': 0.0004977337754945731, 'samples': 1603008, 'steps': 8348, 'loss/train': 1.9418188333511353}} +11/06/2021 22:24:52 - INFO - __main__ - Step 8357: {'lr': 0.0004977280685969971, 'samples': 1604544, 'steps': 8356, 'loss/train': 2.2838523387908936}} +11/06/2021 22:24:54 - INFO - __main__ - Step 8361: {'lr': 0.0004977252124692601, 'samples': 1605312, 'steps': 8360, 'loss/train': 1.8619705438613892}} +11/06/2021 22:24:55 - INFO - __main__ - Step 8365: {'lr': 0.0004977223545555847, 'samples': 1606080, 'steps': 8364, 'loss/train': 1.9046440124511719}} +11/06/2021 22:24:57 - INFO - __main__ - Step 8369: {'lr': 0.0004977194948559913, 'samples': 1606848, 'steps': 8368, 'loss/train': 1.6611480712890625}} +11/06/2021 22:24:59 - INFO - __main__ - Step 8373: {'lr': 0.0004977166333705005, 'samples': 1607616, 'steps': 8372, 'loss/train': 1.0230144262313843}} +11/06/2021 22:25:01 - INFO - __main__ - Step 8377: {'lr': 0.0004977137700991332, 'samples': 1608384, 'steps': 8376, 'loss/train': 1.4530218839645386}} +11/06/2021 22:25:03 - INFO - __main__ - Step 8381: {'lr': 0.0004977109050419097, 'samples': 1609152, 'steps': 8380, 'loss/train': 2.402639150619507}}} +11/06/2021 22:25:05 - INFO - __main__ - Step 8385: {'lr': 0.000497708038198851, 'samples': 1609920, 'steps': 8384, 'loss/train': 1.6063017845153809}}} +11/06/2021 22:25:07 - INFO - __main__ - Step 8390: {'lr': 0.000497704452133728, 'samples': 1610880, 'steps': 8389, 'loss/train': 2.0732336044311523}}} +11/06/2021 22:25:07 - INFO - __main__ - Step 8390: {'lr': 0.000497704452133728, 'samples': 1610880, 'steps': 8389, 'loss/train': 2.0732336044311523}}} +11/06/2021 22:25:11 - INFO - __main__ - Step 8398: {'lr': 0.0004976987086257342, 'samples': 1612416, 'steps': 8397, 'loss/train': 1.0962588787078857}} +11/06/2021 22:25:13 - INFO - __main__ - Step 8402: {'lr': 0.0004976958341931057, 'samples': 1613184, 'steps': 8401, 'loss/train': 1.0811164379119873}} +11/06/2021 22:25:15 - INFO - __main__ - Step 8406: {'lr': 0.0004976929579747505, 'samples': 1613952, 'steps': 8405, 'loss/train': 1.7756294012069702}} +11/06/2021 22:25:17 - INFO - __main__ - Step 8411: {'lr': 0.00049768936019066, 'samples': 1614912, 'steps': 8410, 'loss/train': 1.824702262878418}02}} +11/06/2021 22:25:17 - INFO - __main__ - Step 8411: {'lr': 0.00049768936019066, 'samples': 1614912, 'steps': 8410, 'loss/train': 1.824702262878418}02}} +11/06/2021 22:25:21 - INFO - __main__ - Step 8419: {'lr': 0.0004976835979326718, 'samples': 1616448, 'steps': 8418, 'loss/train': 1.5903434753417969}} +11/06/2021 22:25:21 - INFO - __main__ - Step 8419: {'lr': 0.0004976835979326718, 'samples': 1616448, 'steps': 8418, 'loss/train': 1.5903434753417969}} +11/06/2021 22:25:25 - INFO - __main__ - Step 8426: {'lr': 0.0004976785500978, 'samples': 1617792, 'steps': 8425, 'loss/train': 1.5716438293457031}69}} +11/06/2021 22:25:27 - INFO - __main__ - Step 8431: {'lr': 0.0004976749411534525, 'samples': 1618752, 'steps': 8430, 'loss/train': 1.566307783126831}}} +11/06/2021 22:25:29 - INFO - __main__ - Step 8435: {'lr': 0.0004976720519891994, 'samples': 1619520, 'steps': 8434, 'loss/train': 1.7268136739730835}} +11/06/2021 22:25:31 - INFO - __main__ - Step 8439: {'lr': 0.0004976691610393911, 'samples': 1620288, 'steps': 8438, 'loss/train': 2.1499216556549072}} +11/06/2021 22:25:33 - INFO - __main__ - Step 8443: {'lr': 0.0004976662683040484, 'samples': 1621056, 'steps': 8442, 'loss/train': 1.7835140228271484}} +11/06/2021 22:25:35 - INFO - __main__ - Step 8448: {'lr': 0.000497662649873994, 'samples': 1622016, 'steps': 8447, 'loss/train': 1.2889354228973389}}} +11/06/2021 22:25:37 - INFO - __main__ - Step 8452: {'lr': 0.000497659753121275, 'samples': 1622784, 'steps': 8451, 'loss/train': 2.0676944255828857}}} +11/06/2021 22:25:37 - INFO - __main__ - Step 8452: {'lr': 0.000497659753121275, 'samples': 1622784, 'steps': 8451, 'loss/train': 2.0676944255828857}}} +11/06/2021 22:25:41 - INFO - __main__ - Step 8459: {'lr': 0.0004976546795077503, 'samples': 1624128, 'steps': 8458, 'loss/train': 2.1664505004882812}} +11/06/2021 22:25:43 - INFO - __main__ - Step 8464: {'lr': 0.000497651052150402, 'samples': 1625088, 'steps': 8463, 'loss/train': 1.3184614181518555}}} +11/06/2021 22:25:45 - INFO - __main__ - Step 8468: {'lr': 0.0004976481482559421, 'samples': 1625856, 'steps': 8467, 'loss/train': 1.5242974758148193}} +11/06/2021 22:25:48 - INFO - __main__ - Step 8473: {'lr': 0.0004976445158771748, 'samples': 1626816, 'steps': 8472, 'loss/train': 1.7219116687774658}} +11/06/2021 22:25:50 - INFO - __main__ - Step 8477: {'lr': 0.0004976416079656328, 'samples': 1627584, 'steps': 8476, 'loss/train': 2.3073718547821045}} +11/06/2021 22:25:52 - INFO - __main__ - Step 8481: {'lr': 0.0004976386982687549, 'samples': 1628352, 'steps': 8480, 'loss/train': 1.8894435167312622}} +11/06/2021 22:25:53 - INFO - __main__ - Step 8485: {'lr': 0.0004976357867865621, 'samples': 1629120, 'steps': 8484, 'loss/train': 1.8762072324752808}} +11/06/2021 22:25:56 - INFO - __main__ - Step 8490: {'lr': 0.0004976321449232542, 'samples': 1630080, 'steps': 8489, 'loss/train': 1.4703295230865479}} +11/06/2021 22:25:58 - INFO - __main__ - Step 8494: {'lr': 0.0004976292294241798, 'samples': 1630848, 'steps': 8493, 'loss/train': 1.3954660892486572}} +11/06/2021 22:26:00 - INFO - __main__ - Step 8498: {'lr': 0.000497626312139859, 'samples': 1631616, 'steps': 8497, 'loss/train': 1.7845796346664429}}} +11/06/2021 22:26:02 - INFO - __main__ - Step 8502: {'lr': 0.0004976233930703126, 'samples': 1632384, 'steps': 8501, 'loss/train': 1.7581290006637573}} +11/06/2021 22:26:03 - INFO - __main__ - Step 8506: {'lr': 0.0004976204722155617, 'samples': 1633152, 'steps': 8505, 'loss/train': 1.7833354473114014}} +11/06/2021 22:26:06 - INFO - __main__ - Step 8510: {'lr': 0.0004976175495756274, 'samples': 1633920, 'steps': 8509, 'loss/train': 1.9994100332260132}} +11/06/2021 22:26:06 - INFO - __main__ - Step 8510: {'lr': 0.0004976175495756274, 'samples': 1633920, 'steps': 8509, 'loss/train': 1.9994100332260132}} +11/06/2021 22:26:10 - INFO - __main__ - Step 8518: {'lr': 0.0004976116989402929, 'samples': 1635456, 'steps': 8517, 'loss/train': 1.7013543844223022}} +11/06/2021 22:26:11 - INFO - __main__ - Step 8522: {'lr': 0.0004976087709449348, 'samples': 1636224, 'steps': 8521, 'loss/train': 1.6207133531570435}} +11/06/2021 22:26:13 - INFO - __main__ - Step 8526: {'lr': 0.0004976058411644777, 'samples': 1636992, 'steps': 8525, 'loss/train': 1.7340941429138184}} +11/06/2021 22:26:16 - INFO - __main__ - Step 8531: {'lr': 0.000497602176428643, 'samples': 1637952, 'steps': 8530, 'loss/train': 2.355168342590332}4}} +11/06/2021 22:26:18 - INFO - __main__ - Step 8536: {'lr': 0.0004975985089036652, 'samples': 1638912, 'steps': 8535, 'loss/train': 1.7440499067306519}} +11/06/2021 22:26:18 - INFO - __main__ - Step 8536: {'lr': 0.0004975985089036652, 'samples': 1638912, 'steps': 8535, 'loss/train': 1.7440499067306519}} +11/06/2021 22:26:22 - INFO - __main__ - Step 8543: {'lr': 0.0004975933696830147, 'samples': 1640256, 'steps': 8542, 'loss/train': 1.9213240146636963}} +11/06/2021 22:26:23 - INFO - __main__ - Step 8547: {'lr': 0.0004975904305311344, 'samples': 1641024, 'steps': 8546, 'loss/train': 2.413429021835327}}} +11/06/2021 22:26:26 - INFO - __main__ - Step 8551: {'lr': 0.0004975874895942872, 'samples': 1641792, 'steps': 8550, 'loss/train': 1.2816332578659058}} +11/06/2021 22:26:28 - INFO - __main__ - Step 8555: {'lr': 0.0004975845468724944, 'samples': 1642560, 'steps': 8554, 'loss/train': 1.236737847328186}}} +11/06/2021 22:26:30 - INFO - __main__ - Step 8559: {'lr': 0.000497581602365777, 'samples': 1643328, 'steps': 8558, 'loss/train': 2.347743511199951}}}} +11/06/2021 22:26:32 - INFO - __main__ - Step 8564: {'lr': 0.0004975779192223629, 'samples': 1644288, 'steps': 8563, 'loss/train': 1.7488797903060913}} +11/06/2021 22:26:34 - INFO - __main__ - Step 8568: {'lr': 0.0004975749706996433, 'samples': 1645056, 'steps': 8567, 'loss/train': 1.9086993932724}13}} +11/06/2021 22:26:36 - INFO - __main__ - Step 8572: {'lr': 0.0004975720203920683, 'samples': 1645824, 'steps': 8571, 'loss/train': 2.3485770225524902}} +11/06/2021 22:26:38 - INFO - __main__ - Step 8576: {'lr': 0.0004975690682996592, 'samples': 1646592, 'steps': 8575, 'loss/train': 1.9467846155166626}} +11/06/2021 22:26:40 - INFO - __main__ - Step 8580: {'lr': 0.0004975661144224374, 'samples': 1647360, 'steps': 8579, 'loss/train': 2.0112924575805664}} +11/06/2021 22:26:40 - INFO - __main__ - Step 8580: {'lr': 0.0004975661144224374, 'samples': 1647360, 'steps': 8579, 'loss/train': 2.0112924575805664}} +11/06/2021 22:26:44 - INFO - __main__ - Step 8587: {'lr': 0.0004975609408426572, 'samples': 1648704, 'steps': 8586, 'loss/train': 1.84238600730896}4}} +11/06/2021 22:26:46 - INFO - __main__ - Step 8591: {'lr': 0.0004975579820573099, 'samples': 1649472, 'steps': 8590, 'loss/train': 1.5335558652877808}} +11/06/2021 22:26:48 - INFO - __main__ - Step 8596: {'lr': 0.0004975542810658476, 'samples': 1650432, 'steps': 8595, 'loss/train': 1.850310206413269}}} +11/06/2021 22:26:48 - INFO - __main__ - Step 8596: {'lr': 0.0004975542810658476, 'samples': 1650432, 'steps': 8595, 'loss/train': 1.850310206413269}}} +11/06/2021 22:26:52 - INFO - __main__ - Step 8603: {'lr': 0.0004975490949929558, 'samples': 1651776, 'steps': 8602, 'loss/train': 1.782822608947754}}} +11/06/2021 22:26:54 - INFO - __main__ - Step 8607: {'lr': 0.000497546129068805, 'samples': 1652544, 'steps': 8606, 'loss/train': 1.4670497179031372}}} +11/06/2021 22:26:56 - INFO - __main__ - Step 8612: {'lr': 0.0004975424191539585, 'samples': 1653504, 'steps': 8611, 'loss/train': 1.8894764184951782}} +11/06/2021 22:26:58 - INFO - __main__ - Step 8616: {'lr': 0.0004975394492143808, 'samples': 1654272, 'steps': 8615, 'loss/train': 2.525263547897339}}} +11/06/2021 22:26:58 - INFO - __main__ - Step 8616: {'lr': 0.0004975394492143808, 'samples': 1654272, 'steps': 8615, 'loss/train': 2.525263547897339}}} +11/06/2021 22:27:02 - INFO - __main__ - Step 8623: {'lr': 0.000497534247525941, 'samples': 1655616, 'steps': 8622, 'loss/train': 1.932421326637268}}}} +11/06/2021 22:27:04 - INFO - __main__ - Step 8628: {'lr': 0.0004975305286881383, 'samples': 1656576, 'steps': 8627, 'loss/train': 1.7895426750183105}} +11/06/2021 22:27:06 - INFO - __main__ - Step 8632: {'lr': 0.0004975275516102922, 'samples': 1657344, 'steps': 8631, 'loss/train': 1.7859746217727661}} +11/06/2021 22:27:08 - INFO - __main__ - Step 8636: {'lr': 0.0004975245727479325, 'samples': 1658112, 'steps': 8635, 'loss/train': 1.8529094457626343}} +11/06/2021 22:27:10 - INFO - __main__ - Step 8640: {'lr': 0.0004975215921010808, 'samples': 1658880, 'steps': 8639, 'loss/train': 1.9541411399841309}} +11/06/2021 22:27:10 - INFO - __main__ - Step 8640: {'lr': 0.0004975215921010808, 'samples': 1658880, 'steps': 8639, 'loss/train': 1.9541411399841309}} +11/06/2021 22:27:14 - INFO - __main__ - Step 8647: {'lr': 0.000497516371675221, 'samples': 1660224, 'steps': 8646, 'loss/train': 2.2316641807556152}}} +11/06/2021 22:27:16 - INFO - __main__ - Step 8651: {'lr': 0.000497513386121127, 'samples': 1660992, 'steps': 8650, 'loss/train': 1.510509729385376}}}} +11/06/2021 22:27:18 - INFO - __main__ - Step 8655: {'lr': 0.0004975103987826217, 'samples': 1661760, 'steps': 8654, 'loss/train': 1.5138027667999268}} +11/06/2021 22:27:20 - INFO - __main__ - Step 8660: {'lr': 0.0004975066621001943, 'samples': 1662720, 'steps': 8659, 'loss/train': 1.1997767686843872}} +11/06/2021 22:27:20 - INFO - __main__ - Step 8660: {'lr': 0.0004975066621001943, 'samples': 1662720, 'steps': 8659, 'loss/train': 1.1997767686843872}} +11/06/2021 22:27:24 - INFO - __main__ - Step 8668: {'lr': 0.0004975006776091484, 'samples': 1664256, 'steps': 8667, 'loss/train': 1.9532525539398193}} +11/06/2021 22:27:26 - INFO - __main__ - Step 8672: {'lr': 0.000497497682687135, 'samples': 1665024, 'steps': 8671, 'loss/train': 1.5913190841674805}}} +11/06/2021 22:27:28 - INFO - __main__ - Step 8676: {'lr': 0.0004974946859808235, 'samples': 1665792, 'steps': 8675, 'loss/train': 1.5062406063079834}} +11/06/2021 22:27:30 - INFO - __main__ - Step 8681: {'lr': 0.0004974909375887976, 'samples': 1666752, 'steps': 8680, 'loss/train': 1.7356830835342407}} +11/06/2021 22:27:32 - INFO - __main__ - Step 8686: {'lr': 0.0004974871864088818, 'samples': 1667712, 'steps': 8685, 'loss/train': 1.7284247875213623}} +11/06/2021 22:27:32 - INFO - __main__ - Step 8686: {'lr': 0.0004974871864088818, 'samples': 1667712, 'steps': 8685, 'loss/train': 1.7284247875213623}} +11/06/2021 22:27:36 - INFO - __main__ - Step 8693: {'lr': 0.000497481930073425, 'samples': 1669056, 'steps': 8692, 'loss/train': 1.9291731119155884}}} +11/06/2021 22:27:38 - INFO - __main__ - Step 8697: {'lr': 0.0004974789239999027, 'samples': 1669824, 'steps': 8696, 'loss/train': 1.7184191942214966}} +11/06/2021 22:27:40 - INFO - __main__ - Step 8702: {'lr': 0.0004974751638990233, 'samples': 1670784, 'steps': 8701, 'loss/train': 1.9571999311447144}} +11/06/2021 22:27:43 - INFO - __main__ - Step 8706: {'lr': 0.0004974721538111649, 'samples': 1671552, 'steps': 8705, 'loss/train': 1.7644202709197998}} +11/06/2021 22:27:45 - INFO - __main__ - Step 8710: {'lr': 0.0004974691419391922, 'samples': 1672320, 'steps': 8709, 'loss/train': 1.8900412321090698}} +11/06/2021 22:27:46 - INFO - __main__ - Step 8714: {'lr': 0.0004974661282831272, 'samples': 1673088, 'steps': 8713, 'loss/train': 1.890992522239685}}} +11/06/2021 22:27:48 - INFO - __main__ - Step 8718: {'lr': 0.0004974631128429915, 'samples': 1673856, 'steps': 8717, 'loss/train': 2.640268564224243}}} +11/06/2021 22:27:48 - INFO - __main__ - Step 8718: {'lr': 0.0004974631128429915, 'samples': 1673856, 'steps': 8717, 'loss/train': 2.640268564224243}}} +11/06/2021 22:27:52 - INFO - __main__ - Step 8726: {'lr': 0.000497457076610595, 'samples': 1675392, 'steps': 8725, 'loss/train': 1.7877483367919922}}} +11/06/2021 22:27:52 - INFO - __main__ - Step 8726: {'lr': 0.000497457076610595, 'samples': 1675392, 'steps': 8725, 'loss/train': 1.7877483367919922}}} +11/06/2021 22:27:55 - INFO - __main__ - Step 8733: {'lr': 0.0004974517890534742, 'samples': 1676736, 'steps': 8732, 'loss/train': 2.029585361480713}}} +11/06/2021 22:27:58 - INFO - __main__ - Step 8738: {'lr': 0.0004974480088820139, 'samples': 1677696, 'steps': 8737, 'loss/train': 1.93135666847229}}}} +11/06/2021 22:27:58 - INFO - __main__ - Step 8738: {'lr': 0.0004974480088820139, 'samples': 1677696, 'steps': 8737, 'loss/train': 1.93135666847229}}}} +11/06/2021 22:28:01 - INFO - __main__ - Step 8745: {'lr': 0.0004974427119591361, 'samples': 1679040, 'steps': 8744, 'loss/train': 2.352595090866089}}} +11/06/2021 22:28:03 - INFO - __main__ - Step 8749: {'lr': 0.0004974396826931906, 'samples': 1679808, 'steps': 8748, 'loss/train': 2.0725631713867188}} +11/06/2021 22:28:06 - INFO - __main__ - Step 8754: {'lr': 0.00049743589360218, 'samples': 1680768, 'steps': 8753, 'loss/train': 2.1746933460235596}8}} +11/06/2021 22:28:08 - INFO - __main__ - Step 8759: {'lr': 0.0004974321017238994, 'samples': 1681728, 'steps': 8758, 'loss/train': 1.5569329261779785}} +11/06/2021 22:28:10 - INFO - __main__ - Step 8763: {'lr': 0.0004974290662144694, 'samples': 1682496, 'steps': 8762, 'loss/train': 1.675337791442871}}} +11/06/2021 22:28:10 - INFO - __main__ - Step 8763: {'lr': 0.0004974290662144694, 'samples': 1682496, 'steps': 8762, 'loss/train': 1.675337791442871}}} +11/06/2021 22:28:13 - INFO - __main__ - Step 8770: {'lr': 0.0004974237497807027, 'samples': 1683840, 'steps': 8769, 'loss/train': 0.3073934018611908}} +11/06/2021 22:28:16 - INFO - __main__ - Step 8775: {'lr': 0.0004974199489834457, 'samples': 1684800, 'steps': 8774, 'loss/train': 1.757877230644226}}} +11/06/2021 22:28:18 - INFO - __main__ - Step 8779: {'lr': 0.000497416906338933, 'samples': 1685568, 'steps': 8778, 'loss/train': 2.1888182163238525}}} +11/06/2021 22:28:20 - INFO - __main__ - Step 8784: {'lr': 0.0004974131005249444, 'samples': 1686528, 'steps': 8783, 'loss/train': 1.3217498064041138}} +11/06/2021 22:28:20 - INFO - __main__ - Step 8784: {'lr': 0.0004974131005249444, 'samples': 1686528, 'steps': 8783, 'loss/train': 1.3217498064041138}} +11/06/2021 22:28:24 - INFO - __main__ - Step 8791: {'lr': 0.0004974077677031879, 'samples': 1687872, 'steps': 8790, 'loss/train': 1.7749842405319214}} +11/06/2021 22:28:26 - INFO - __main__ - Step 8795: {'lr': 0.0004974047179239436, 'samples': 1688640, 'steps': 8794, 'loss/train': 1.9513581991195679}} +11/06/2021 22:28:28 - INFO - __main__ - Step 8800: {'lr': 0.000497400903191664, 'samples': 1689600, 'steps': 8799, 'loss/train': 1.5480501651763916}}} +11/06/2021 22:28:30 - INFO - __main__ - Step 8805: {'lr': 0.0004973970856725086, 'samples': 1690560, 'steps': 8804, 'loss/train': 1.862740159034729}}} +11/06/2021 22:28:30 - INFO - __main__ - Step 8805: {'lr': 0.0004973970856725086, 'samples': 1690560, 'steps': 8804, 'loss/train': 1.862740159034729}}} +11/06/2021 22:28:34 - INFO - __main__ - Step 8812: {'lr': 0.0004973917364638218, 'samples': 1691904, 'steps': 8811, 'loss/train': 1.7712737321853638}} +11/06/2021 22:28:36 - INFO - __main__ - Step 8816: {'lr': 0.0004973886773207763, 'samples': 1692672, 'steps': 8815, 'loss/train': 1.6713685989379883}} +11/06/2021 22:28:38 - INFO - __main__ - Step 8820: {'lr': 0.0004973856163942185, 'samples': 1693440, 'steps': 8819, 'loss/train': 1.8286590576171875}} +11/06/2021 22:28:41 - INFO - __main__ - Step 8826: {'lr': 0.0004973810216603443, 'samples': 1694592, 'steps': 8825, 'loss/train': 0.3064444959163666}} +11/06/2021 22:28:43 - INFO - __main__ - Step 8830: {'lr': 0.0004973779562751022, 'samples': 1695360, 'steps': 8829, 'loss/train': 1.7933107614517212}} +11/06/2021 22:28:43 - INFO - __main__ - Step 8830: {'lr': 0.0004973779562751022, 'samples': 1695360, 'steps': 8829, 'loss/train': 1.7933107614517212}} +11/06/2021 22:28:46 - INFO - __main__ - Step 8837: {'lr': 0.0004973725875595513, 'samples': 1696704, 'steps': 8836, 'loss/train': 2.336061716079712}}} +11/06/2021 22:28:48 - INFO - __main__ - Step 8841: {'lr': 0.000497369517269916, 'samples': 1697472, 'steps': 8840, 'loss/train': 2.1014244556427}12}}} +11/06/2021 22:28:50 - INFO - __main__ - Step 8846: {'lr': 0.0004973656769000046, 'samples': 1698432, 'steps': 8845, 'loss/train': 1.0025054216384888}} +11/06/2021 22:28:53 - INFO - __main__ - Step 8850: {'lr': 0.0004973626025978086, 'samples': 1699200, 'steps': 8849, 'loss/train': 1.551592469215393}}} +11/06/2021 22:28:55 - INFO - __main__ - Step 8854: {'lr': 0.0004973595265122883, 'samples': 1699968, 'steps': 8853, 'loss/train': 2.4081969261169434}} +11/06/2021 22:28:56 - INFO - __main__ - Step 8858: {'lr': 0.0004973564486434656, 'samples': 1700736, 'steps': 8857, 'loss/train': 1.6520261764526367}} +11/06/2021 22:28:58 - INFO - __main__ - Step 8862: {'lr': 0.0004973533689913631, 'samples': 1701504, 'steps': 8861, 'loss/train': 1.570049524307251}}} +11/06/2021 22:29:01 - INFO - __main__ - Step 8867: {'lr': 0.0004973495169185313, 'samples': 1702464, 'steps': 8866, 'loss/train': 1.2922062873840332}} +11/06/2021 22:29:03 - INFO - __main__ - Step 8871: {'lr': 0.00049734643325413, 'samples': 1703232, 'steps': 8870, 'loss/train': 1.7162529230117798}2}} +11/06/2021 22:29:05 - INFO - __main__ - Step 8875: {'lr': 0.0004973433478065209, 'samples': 1704000, 'steps': 8874, 'loss/train': 1.6638219356536865}} +11/06/2021 22:29:05 - INFO - __main__ - Step 8875: {'lr': 0.0004973433478065209, 'samples': 1704000, 'steps': 8874, 'loss/train': 1.6638219356536865}} +11/06/2021 22:29:08 - INFO - __main__ - Step 8882: {'lr': 0.0004973379439824283, 'samples': 1705344, 'steps': 8881, 'loss/train': 2.2020576000213623}} +11/06/2021 22:29:11 - INFO - __main__ - Step 8887: {'lr': 0.0004973340807646696, 'samples': 1706304, 'steps': 8886, 'loss/train': 2.3790831565856934}} +11/06/2021 22:29:13 - INFO - __main__ - Step 8891: {'lr': 0.000497330988184452, 'samples': 1707072, 'steps': 8890, 'loss/train': 1.9604440927505493}}} +11/06/2021 22:29:13 - INFO - __main__ - Step 8891: {'lr': 0.000497330988184452, 'samples': 1707072, 'steps': 8890, 'loss/train': 1.9604440927505493}}} +11/06/2021 22:29:16 - INFO - __main__ - Step 8898: {'lr': 0.0004973255718785088, 'samples': 1708416, 'steps': 8897, 'loss/train': 1.7817871570587158}} +11/06/2021 22:29:18 - INFO - __main__ - Step 8903: {'lr': 0.00049732169974531, 'samples': 1709376, 'steps': 8902, 'loss/train': 1.8295646905899048}8}} +11/06/2021 22:29:21 - INFO - __main__ - Step 8908: {'lr': 0.0004973178248261274, 'samples': 1710336, 'steps': 8907, 'loss/train': 2.1482808589935303}} +11/06/2021 22:29:23 - INFO - __main__ - Step 8912: {'lr': 0.0004973147228849027, 'samples': 1711104, 'steps': 8911, 'loss/train': 1.924820065498352}}} +11/06/2021 22:29:23 - INFO - __main__ - Step 8912: {'lr': 0.0004973147228849027, 'samples': 1711104, 'steps': 8911, 'loss/train': 1.924820065498352}}} +11/06/2021 22:29:26 - INFO - __main__ - Step 8919: {'lr': 0.000497309290197479, 'samples': 1712448, 'steps': 8918, 'loss/train': 1.6200121641159058}}} +11/06/2021 22:29:28 - INFO - __main__ - Step 8924: {'lr': 0.0004973054063634428, 'samples': 1713408, 'steps': 8923, 'loss/train': 1.9554498195648193}} +11/06/2021 22:29:31 - INFO - __main__ - Step 8929: {'lr': 0.0004973015197436063, 'samples': 1714368, 'steps': 8928, 'loss/train': 3.589097023010254}}} +11/06/2021 22:29:31 - INFO - __main__ - Step 8929: {'lr': 0.0004973015197436063, 'samples': 1714368, 'steps': 8928, 'loss/train': 3.589097023010254}}} +11/06/2021 22:29:34 - INFO - __main__ - Step 8936: {'lr': 0.0004972960737957749, 'samples': 1715712, 'steps': 8935, 'loss/train': 1.9268077611923218}} +11/06/2021 22:29:36 - INFO - __main__ - Step 8940: {'lr': 0.0004972929593741662, 'samples': 1716480, 'steps': 8939, 'loss/train': 1.9634605646133423}} +11/06/2021 22:29:36 - INFO - __main__ - Step 8940: {'lr': 0.0004972929593741662, 'samples': 1716480, 'steps': 8939, 'loss/train': 1.9634605646133423}} +11/06/2021 22:29:41 - INFO - __main__ - Step 8948: {'lr': 0.0004972867251825048, 'samples': 1718016, 'steps': 8947, 'loss/train': 2.001603841781616}}} +11/06/2021 22:29:42 - INFO - __main__ - Step 8952: {'lr': 0.0004972836054124968, 'samples': 1718784, 'steps': 8951, 'loss/train': 1.9462846517562866}} +11/06/2021 22:29:44 - INFO - __main__ - Step 8956: {'lr': 0.000497280483859734, 'samples': 1719552, 'steps': 8955, 'loss/train': 1.3424328565597534}}} +11/06/2021 22:29:47 - INFO - __main__ - Step 8961: {'lr': 0.0004972765794118158, 'samples': 1720512, 'steps': 8960, 'loss/train': 1.1508708000183105}} +11/06/2021 22:29:49 - INFO - __main__ - Step 8965: {'lr': 0.0004972734538479369, 'samples': 1721280, 'steps': 8964, 'loss/train': 2.106870174407959}}} +11/06/2021 22:29:51 - INFO - __main__ - Step 8969: {'lr': 0.0004972703265013764, 'samples': 1722048, 'steps': 8968, 'loss/train': 1.7631484270095825}} +11/06/2021 22:29:51 - INFO - __main__ - Step 8969: {'lr': 0.0004972703265013764, 'samples': 1722048, 'steps': 8968, 'loss/train': 1.7631484270095825}} +11/06/2021 22:29:54 - INFO - __main__ - Step 8976: {'lr': 0.0004972648493553856, 'samples': 1723392, 'steps': 8975, 'loss/train': 1.3855030536651611}} +11/06/2021 22:29:57 - INFO - __main__ - Step 8982: {'lr': 0.0004972601503136822, 'samples': 1724544, 'steps': 8981, 'loss/train': 1.6659023761749268}} +11/06/2021 22:29:57 - INFO - __main__ - Step 8982: {'lr': 0.0004972601503136822, 'samples': 1724544, 'steps': 8981, 'loss/train': 1.6659023761749268}} +11/06/2021 22:30:01 - INFO - __main__ - Step 8989: {'lr': 0.0004972546630291387, 'samples': 1725888, 'steps': 8988, 'loss/train': 1.9944013357162476}} +11/06/2021 22:30:02 - INFO - __main__ - Step 8993: {'lr': 0.0004972515249869622, 'samples': 1726656, 'steps': 8992, 'loss/train': 1.706042766571045}}} +11/06/2021 22:30:04 - INFO - __main__ - Step 8997: {'lr': 0.0004972483851622623, 'samples': 1727424, 'steps': 8996, 'loss/train': 2.627495527267456}}} +11/06/2021 22:30:07 - INFO - __main__ - Step 9002: {'lr': 0.000497244457874748, 'samples': 1728384, 'steps': 9001, 'loss/train': 1.736275315284729}}}} +11/06/2021 22:30:09 - INFO - __main__ - Step 9006: {'lr': 0.0004972413140394528, 'samples': 1729152, 'steps': 9005, 'loss/train': 2.118058204650879}}} +11/06/2021 22:30:11 - INFO - __main__ - Step 9010: {'lr': 0.0004972381684217077, 'samples': 1729920, 'steps': 9009, 'loss/train': 1.8316234350204468}} +11/06/2021 22:30:12 - INFO - __main__ - Step 9014: {'lr': 0.0004972350210215353, 'samples': 1730688, 'steps': 9013, 'loss/train': 1.3896691799163818}} +11/06/2021 22:30:14 - INFO - __main__ - Step 9018: {'lr': 0.0004972318718389583, 'samples': 1731456, 'steps': 9017, 'loss/train': 2.1753854751586914}} +11/06/2021 22:30:17 - INFO - __main__ - Step 9023: {'lr': 0.0004972279328542652, 'samples': 1732416, 'steps': 9022, 'loss/train': 2.2019128799438477}} +11/06/2021 22:30:19 - INFO - __main__ - Step 9027: {'lr': 0.0004972247796613611, 'samples': 1733184, 'steps': 9026, 'loss/train': 1.2223052978515625}} +11/06/2021 22:30:21 - INFO - __main__ - Step 9031: {'lr': 0.0004972216246861262, 'samples': 1733952, 'steps': 9030, 'loss/train': 2.1160690784454346}} +11/06/2021 22:30:22 - INFO - __main__ - Step 9035: {'lr': 0.0004972184679285833, 'samples': 1734720, 'steps': 9034, 'loss/train': 1.6166201829910278}} +11/06/2021 22:30:24 - INFO - __main__ - Step 9039: {'lr': 0.0004972153093887551, 'samples': 1735488, 'steps': 9038, 'loss/train': 1.671932578086853}}} +11/06/2021 22:30:27 - INFO - __main__ - Step 9044: {'lr': 0.000497211358707666, 'samples': 1736448, 'steps': 9043, 'loss/train': 1.862133502960205}}}} +11/06/2021 22:30:27 - INFO - __main__ - Step 9044: {'lr': 0.000497211358707666, 'samples': 1736448, 'steps': 9043, 'loss/train': 1.862133502960205}}}} +11/06/2021 22:30:30 - INFO - __main__ - Step 9050: {'lr': 0.0004972066142145055, 'samples': 1737600, 'steps': 9049, 'loss/train': 1.216286540031433}}} +11/06/2021 22:30:32 - INFO - __main__ - Step 9055: {'lr': 0.0004972026574070459, 'samples': 1738560, 'steps': 9054, 'loss/train': 2.233604907989502}}} +11/06/2021 22:30:35 - INFO - __main__ - Step 9060: {'lr': 0.0004971986978149437, 'samples': 1739520, 'steps': 9059, 'loss/train': 1.568691372871399}}} +11/06/2021 22:30:37 - INFO - __main__ - Step 9064: {'lr': 0.0004971955281363493, 'samples': 1740288, 'steps': 9063, 'loss/train': 1.9272085428237915}} +11/06/2021 22:30:37 - INFO - __main__ - Step 9064: {'lr': 0.0004971955281363493, 'samples': 1740288, 'steps': 9063, 'loss/train': 1.9272085428237915}} +11/06/2021 22:30:40 - INFO - __main__ - Step 9071: {'lr': 0.000497189976910597, 'samples': 1741632, 'steps': 9070, 'loss/train': 2.2380783557891846}}} +11/06/2021 22:30:42 - INFO - __main__ - Step 9075: {'lr': 0.000497186802331228, 'samples': 1742400, 'steps': 9074, 'loss/train': 2.291787624359131}}}} +11/06/2021 22:30:42 - INFO - __main__ - Step 9075: {'lr': 0.000497186802331228, 'samples': 1742400, 'steps': 9074, 'loss/train': 2.291787624359131}}}} +11/06/2021 22:30:47 - INFO - __main__ - Step 9084: {'lr': 0.0004971796530120371, 'samples': 1744128, 'steps': 9083, 'loss/train': 1.885785460472107}}} +11/06/2021 22:30:49 - INFO - __main__ - Step 9088: {'lr': 0.0004971764726410668, 'samples': 1744896, 'steps': 9087, 'loss/train': 1.8160526752471924}} +11/06/2021 22:30:50 - INFO - __main__ - Step 9092: {'lr': 0.000497173290488114, 'samples': 1745664, 'steps': 9091, 'loss/train': 1.6177334785461426}}} +11/06/2021 22:30:53 - INFO - __main__ - Step 9096: {'lr': 0.0004971701065532017, 'samples': 1746432, 'steps': 9095, 'loss/train': 1.4940237998962402}} +11/06/2021 22:30:53 - INFO - __main__ - Step 9096: {'lr': 0.0004971701065532017, 'samples': 1746432, 'steps': 9095, 'loss/train': 1.4940237998962402}} +11/06/2021 22:30:56 - INFO - __main__ - Step 9104: {'lr': 0.0004971637333375904, 'samples': 1747968, 'steps': 9103, 'loss/train': 1.4513171911239624}} +11/06/2021 22:30:58 - INFO - __main__ - Step 9108: {'lr': 0.0004971605440569374, 'samples': 1748736, 'steps': 9107, 'loss/train': 1.783698558807373}}} +11/06/2021 22:31:01 - INFO - __main__ - Step 9113: {'lr': 0.0004971565549503723, 'samples': 1749696, 'steps': 9112, 'loss/train': 2.295679807662964}}} +11/06/2021 22:31:03 - INFO - __main__ - Step 9117: {'lr': 0.0004971533616605495, 'samples': 1750464, 'steps': 9116, 'loss/train': 1.4062687158584595}} +11/06/2021 22:31:05 - INFO - __main__ - Step 9121: {'lr': 0.0004971501665889107, 'samples': 1751232, 'steps': 9120, 'loss/train': 1.5485329627990723}} +11/06/2021 22:31:06 - INFO - __main__ - Step 9125: {'lr': 0.0004971469697354792, 'samples': 1752000, 'steps': 9124, 'loss/train': 2.1170740127563477}} +11/06/2021 22:31:09 - INFO - __main__ - Step 9129: {'lr': 0.0004971437711002777, 'samples': 1752768, 'steps': 9128, 'loss/train': 1.880787968635559}}} +11/06/2021 22:31:11 - INFO - __main__ - Step 9134: {'lr': 0.0004971397703006974, 'samples': 1753728, 'steps': 9133, 'loss/train': 2.073517322540283}}} +11/06/2021 22:31:13 - INFO - __main__ - Step 9138: {'lr': 0.0004971365676565984, 'samples': 1754496, 'steps': 9137, 'loss/train': 1.9141130447387695}} +11/06/2021 22:31:15 - INFO - __main__ - Step 9142: {'lr': 0.0004971333632308047, 'samples': 1755264, 'steps': 9141, 'loss/train': 2.0353739261627197}} +11/06/2021 22:31:17 - INFO - __main__ - Step 9146: {'lr': 0.0004971301570233392, 'samples': 1756032, 'steps': 9145, 'loss/train': 2.155123472213745}}} +11/06/2021 22:31:19 - INFO - __main__ - Step 9150: {'lr': 0.0004971269490342252, 'samples': 1756800, 'steps': 9149, 'loss/train': 1.6433255672454834}} +11/06/2021 22:31:21 - INFO - __main__ - Step 9155: {'lr': 0.0004971229365424246, 'samples': 1757760, 'steps': 9154, 'loss/train': 1.973191738128662}}} +11/06/2021 22:31:23 - INFO - __main__ - Step 9159: {'lr': 0.0004971197245446859, 'samples': 1758528, 'steps': 9158, 'loss/train': 2.273866891860962}}} +11/06/2021 22:31:23 - INFO - __main__ - Step 9159: {'lr': 0.0004971197245446859, 'samples': 1758528, 'steps': 9158, 'loss/train': 2.273866891860962}}} +11/06/2021 22:31:26 - INFO - __main__ - Step 9166: {'lr': 0.0004971140992617462, 'samples': 1759872, 'steps': 9165, 'loss/train': 1.977513074874878}}} +11/06/2021 22:31:29 - INFO - __main__ - Step 9171: {'lr': 0.0004971100778621223, 'samples': 1760832, 'steps': 9170, 'loss/train': 1.477123498916626}}} +11/06/2021 22:31:31 - INFO - __main__ - Step 9176: {'lr': 0.0004971060536788988, 'samples': 1761792, 'steps': 9175, 'loss/train': 1.9381426572799683}} +11/06/2021 22:31:33 - INFO - __main__ - Step 9180: {'lr': 0.0004971028323281586, 'samples': 1762560, 'steps': 9179, 'loss/train': 2.6767475605010986}} +11/06/2021 22:31:35 - INFO - __main__ - Step 9184: {'lr': 0.0004970996091959668, 'samples': 1763328, 'steps': 9183, 'loss/train': 1.487623691558838}}} +11/06/2021 22:31:37 - INFO - __main__ - Step 9188: {'lr': 0.0004970963842823468, 'samples': 1764096, 'steps': 9187, 'loss/train': 1.1920486688613892}} +11/06/2021 22:31:39 - INFO - __main__ - Step 9192: {'lr': 0.0004970931575873215, 'samples': 1764864, 'steps': 9191, 'loss/train': 1.533847451210022}}} +11/06/2021 22:31:39 - INFO - __main__ - Step 9192: {'lr': 0.0004970931575873215, 'samples': 1764864, 'steps': 9191, 'loss/train': 1.533847451210022}}} +11/06/2021 22:31:43 - INFO - __main__ - Step 9199: {'lr': 0.0004970875065845914, 'samples': 1766208, 'steps': 9198, 'loss/train': 2.0182600021362305}} +11/06/2021 22:31:45 - INFO - __main__ - Step 9203: {'lr': 0.0004970842749908223, 'samples': 1766976, 'steps': 9202, 'loss/train': 1.710228443145752}}} +11/06/2021 22:31:47 - INFO - __main__ - Step 9208: {'lr': 0.0004970802329936355, 'samples': 1767936, 'steps': 9207, 'loss/train': 1.110896110534668}}} +11/06/2021 22:31:47 - INFO - __main__ - Step 9208: {'lr': 0.0004970802329936355, 'samples': 1767936, 'steps': 9207, 'loss/train': 1.110896110534668}}} +11/06/2021 22:31:51 - INFO - __main__ - Step 9216: {'lr': 0.0004970737600089673, 'samples': 1769472, 'steps': 9215, 'loss/train': 2.018321990966797}}} +11/06/2021 22:31:53 - INFO - __main__ - Step 9220: {'lr': 0.0004970705208447587, 'samples': 1770240, 'steps': 9219, 'loss/train': 1.9058424234390259}} +11/06/2021 22:31:55 - INFO - __main__ - Step 9225: {'lr': 0.0004970664693846618, 'samples': 1771200, 'steps': 9224, 'loss/train': 1.7904118299484253}} +11/06/2021 22:31:55 - INFO - __main__ - Step 9225: {'lr': 0.0004970664693846618, 'samples': 1771200, 'steps': 9224, 'loss/train': 1.7904118299484253}} +11/06/2021 22:31:59 - INFO - __main__ - Step 9233: {'lr': 0.0004970599812596603, 'samples': 1772736, 'steps': 9232, 'loss/train': 1.2998876571655273}} +11/06/2021 22:32:02 - INFO - __main__ - Step 9237: {'lr': 0.0004970567345254339, 'samples': 1773504, 'steps': 9236, 'loss/train': 1.544152021408081}}} +11/06/2021 22:32:03 - INFO - __main__ - Step 9241: {'lr': 0.0004970534860100883, 'samples': 1774272, 'steps': 9240, 'loss/train': 1.7890807390213013}} +11/06/2021 22:32:05 - INFO - __main__ - Step 9245: {'lr': 0.0004970502357136468, 'samples': 1775040, 'steps': 9244, 'loss/train': 1.9643011093139648}} +11/06/2021 22:32:07 - INFO - __main__ - Step 9250: {'lr': 0.0004970461703384647, 'samples': 1776000, 'steps': 9249, 'loss/train': 1.9446792602539062}} +11/06/2021 22:32:07 - INFO - __main__ - Step 9250: {'lr': 0.0004970461703384647, 'samples': 1776000, 'steps': 9249, 'loss/train': 1.9446792602539062}} +11/06/2021 22:32:10 - INFO - __main__ - Step 9256: {'lr': 0.0004970412882148488, 'samples': 1777152, 'steps': 9255, 'loss/train': 1.1907613277435303}} +11/06/2021 22:32:13 - INFO - __main__ - Step 9261: {'lr': 0.0004970372167173915, 'samples': 1778112, 'steps': 9260, 'loss/train': 2.010669708251953}}} +11/06/2021 22:32:15 - INFO - __main__ - Step 9266: {'lr': 0.0004970331424371555, 'samples': 1779072, 'steps': 9265, 'loss/train': 1.760794997215271}}} +11/06/2021 22:32:15 - INFO - __main__ - Step 9266: {'lr': 0.0004970331424371555, 'samples': 1779072, 'steps': 9265, 'loss/train': 1.760794997215271}}} +11/06/2021 22:32:19 - INFO - __main__ - Step 9273: {'lr': 0.0004970274337698436, 'samples': 1780416, 'steps': 9272, 'loss/train': 1.789774775505066}}} +11/06/2021 22:32:21 - INFO - __main__ - Step 9278: {'lr': 0.0004970233528111253, 'samples': 1781376, 'steps': 9277, 'loss/train': 1.9275052547454834}} +11/06/2021 22:32:23 - INFO - __main__ - Step 9282: {'lr': 0.0004970200860406601, 'samples': 1782144, 'steps': 9281, 'loss/train': 1.4385563135147095}} +11/06/2021 22:32:25 - INFO - __main__ - Step 9287: {'lr': 0.0004970160000732539, 'samples': 1783104, 'steps': 9286, 'loss/train': 1.7004362344741821}} +11/06/2021 22:32:25 - INFO - __main__ - Step 9287: {'lr': 0.0004970160000732539, 'samples': 1783104, 'steps': 9286, 'loss/train': 1.7004362344741821}} +11/06/2021 22:32:29 - INFO - __main__ - Step 9294: {'lr': 0.0004970102750442285, 'samples': 1784448, 'steps': 9293, 'loss/train': 2.1833393573760986}} +11/06/2021 22:32:31 - INFO - __main__ - Step 9298: {'lr': 0.0004970070011504846, 'samples': 1785216, 'steps': 9297, 'loss/train': 1.8061836957931519}} +11/06/2021 22:32:33 - INFO - __main__ - Step 9303: {'lr': 0.0004970029062791128, 'samples': 1786176, 'steps': 9302, 'loss/train': 1.933624505996704}}} +11/06/2021 22:32:35 - INFO - __main__ - Step 9307: {'lr': 0.0004969996283786905, 'samples': 1786944, 'steps': 9306, 'loss/train': 1.8101203441619873}} +11/06/2021 22:32:37 - INFO - __main__ - Step 9311: {'lr': 0.0004969963486975607, 'samples': 1787712, 'steps': 9310, 'loss/train': 1.2041494846343994}} +11/06/2021 22:32:39 - INFO - __main__ - Step 9315: {'lr': 0.0004969930672357471, 'samples': 1788480, 'steps': 9314, 'loss/train': 2.183551788330078}}} +11/06/2021 22:32:41 - INFO - __main__ - Step 9319: {'lr': 0.0004969897839932732, 'samples': 1789248, 'steps': 9318, 'loss/train': 1.988546371459961}}} +11/06/2021 22:32:43 - INFO - __main__ - Step 9324: {'lr': 0.0004969856774361634, 'samples': 1790208, 'steps': 9323, 'loss/train': 1.9644792079925537}} +11/06/2021 22:32:46 - INFO - __main__ - Step 9328: {'lr': 0.0004969823901872906, 'samples': 1790976, 'steps': 9327, 'loss/train': 2.1059629917144775}} +11/06/2021 22:32:48 - INFO - __main__ - Step 9332: {'lr': 0.0004969791011578344, 'samples': 1791744, 'steps': 9331, 'loss/train': 1.9717392921447754}} +11/06/2021 22:32:49 - INFO - __main__ - Step 9336: {'lr': 0.0004969758103478187, 'samples': 1792512, 'steps': 9335, 'loss/train': 1.6776036024093628}} +11/06/2021 22:32:51 - INFO - __main__ - Step 9340: {'lr': 0.0004969725177572672, 'samples': 1793280, 'steps': 9339, 'loss/train': 1.5066814422607422}} +11/06/2021 22:32:53 - INFO - __main__ - Step 9345: {'lr': 0.0004969683995152355, 'samples': 1794240, 'steps': 9344, 'loss/train': 3.186241626739502}}} +11/06/2021 22:32:53 - INFO - __main__ - Step 9345: {'lr': 0.0004969683995152355, 'samples': 1794240, 'steps': 9344, 'loss/train': 3.186241626739502}}} +11/06/2021 22:32:57 - INFO - __main__ - Step 9352: {'lr': 0.0004969626293026353, 'samples': 1795584, 'steps': 9351, 'loss/train': 1.7228342294692993}} +11/06/2021 22:32:59 - INFO - __main__ - Step 9356: {'lr': 0.0004969593295901779, 'samples': 1796352, 'steps': 9355, 'loss/train': 1.998396873474121}}} +11/06/2021 22:33:01 - INFO - __main__ - Step 9361: {'lr': 0.0004969552024458976, 'samples': 1797312, 'steps': 9360, 'loss/train': 1.6986967325210571}} +11/06/2021 22:33:01 - INFO - __main__ - Step 9361: {'lr': 0.0004969552024458976, 'samples': 1797312, 'steps': 9360, 'loss/train': 1.6986967325210571}} +11/06/2021 22:33:05 - INFO - __main__ - Step 9369: {'lr': 0.00049694859322881, 'samples': 1798848, 'steps': 9368, 'loss/train': 1.7562119960784912}1}} +11/06/2021 22:33:08 - INFO - __main__ - Step 9373: {'lr': 0.0004969452859497449, 'samples': 1799616, 'steps': 9372, 'loss/train': 1.927634596824646}}} +11/06/2021 22:33:09 - INFO - __main__ - Step 9377: {'lr': 0.000496941976890364, 'samples': 1800384, 'steps': 9376, 'loss/train': 1.6627328395843506}}} +11/06/2021 22:33:09 - INFO - __main__ - Step 9377: {'lr': 0.000496941976890364, 'samples': 1800384, 'steps': 9376, 'loss/train': 1.6627328395843506}}} +11/06/2021 22:33:09 - INFO - __main__ - Step 9377: {'lr': 0.000496941976890364, 'samples': 1800384, 'steps': 9376, 'loss/train': 1.6627328395843506}}} +11/06/2021 22:33:15 - INFO - __main__ - Step 9388: {'lr': 0.0004969328677975083, 'samples': 1802496, 'steps': 9387, 'loss/train': 1.6319315433502197}} +11/06/2021 22:33:17 - INFO - __main__ - Step 9393: {'lr': 0.0004969287228501602, 'samples': 1803456, 'steps': 9392, 'loss/train': 1.8238893747329712}} +11/06/2021 22:33:19 - INFO - __main__ - Step 9397: {'lr': 0.0004969254048895585, 'samples': 1804224, 'steps': 9396, 'loss/train': 1.8003126382827759}} +11/06/2021 22:33:22 - INFO - __main__ - Step 9401: {'lr': 0.0004969220851487844, 'samples': 1804992, 'steps': 9400, 'loss/train': 0.40175554156303406} +11/06/2021 22:33:23 - INFO - __main__ - Step 9405: {'lr': 0.000496918763627862, 'samples': 1805760, 'steps': 9404, 'loss/train': 1.7720991373062134}6} +11/06/2021 22:33:25 - INFO - __main__ - Step 9409: {'lr': 0.0004969154403268148, 'samples': 1806528, 'steps': 9408, 'loss/train': 1.8082882165908813}} +11/06/2021 22:33:27 - INFO - __main__ - Step 9414: {'lr': 0.0004969112836972423, 'samples': 1807488, 'steps': 9413, 'loss/train': 1.678197979927063}}} +11/06/2021 22:33:27 - INFO - __main__ - Step 9414: {'lr': 0.0004969112836972423, 'samples': 1807488, 'steps': 9413, 'loss/train': 1.678197979927063}}} +11/06/2021 22:33:32 - INFO - __main__ - Step 9422: {'lr': 0.0004969046273047161, 'samples': 1809024, 'steps': 9421, 'loss/train': 1.61650812625885}}}} +11/06/2021 22:33:34 - INFO - __main__ - Step 9427: {'lr': 0.0004969004634437042, 'samples': 1809984, 'steps': 9426, 'loss/train': 1.5909390449523926}} +11/06/2021 22:33:35 - INFO - __main__ - Step 9431: {'lr': 0.0004968971303524007, 'samples': 1810752, 'steps': 9430, 'loss/train': 1.2849524021148682}} +11/06/2021 22:33:37 - INFO - __main__ - Step 9435: {'lr': 0.0004968937954811284, 'samples': 1811520, 'steps': 9434, 'loss/train': 1.701316237449646}}} +11/06/2021 22:33:40 - INFO - __main__ - Step 9440: {'lr': 0.0004968896243889941, 'samples': 1812480, 'steps': 9439, 'loss/train': 1.6848827600479126}} +11/06/2021 22:33:42 - INFO - __main__ - Step 9444: {'lr': 0.0004968862855128806, 'samples': 1813248, 'steps': 9443, 'loss/train': 1.394817590713501}}} +11/06/2021 22:33:44 - INFO - __main__ - Step 9448: {'lr': 0.0004968829448568766, 'samples': 1814016, 'steps': 9447, 'loss/train': 1.6947396993637085}} +11/06/2021 22:33:46 - INFO - __main__ - Step 9452: {'lr': 0.0004968796024210064, 'samples': 1814784, 'steps': 9451, 'loss/train': 1.934395670890808}}} +11/06/2021 22:33:47 - INFO - __main__ - Step 9456: {'lr': 0.0004968762582052938, 'samples': 1815552, 'steps': 9455, 'loss/train': 1.959632396697998}}} +11/06/2021 22:33:49 - INFO - __main__ - Step 9460: {'lr': 0.0004968729122097632, 'samples': 1816320, 'steps': 9459, 'loss/train': 1.9877064228057861}} +11/06/2021 22:33:52 - INFO - __main__ - Step 9465: {'lr': 0.0004968687272125174, 'samples': 1817280, 'steps': 9464, 'loss/train': 1.5592188835144043}} +11/06/2021 22:33:52 - INFO - __main__ - Step 9465: {'lr': 0.0004968687272125174, 'samples': 1817280, 'steps': 9464, 'loss/train': 1.5592188835144043}} +11/06/2021 22:33:55 - INFO - __main__ - Step 9472: {'lr': 0.000496862863544504, 'samples': 1818624, 'steps': 9471, 'loss/train': 1.4764689207077026}}} +11/06/2021 22:33:57 - INFO - __main__ - Step 9476: {'lr': 0.0004968595104299422, 'samples': 1819392, 'steps': 9475, 'loss/train': 2.2946574687957764}} +11/06/2021 22:33:59 - INFO - __main__ - Step 9481: {'lr': 0.0004968553165340435, 'samples': 1820352, 'steps': 9480, 'loss/train': 1.7705086469650269}} +11/06/2021 22:33:59 - INFO - __main__ - Step 9481: {'lr': 0.0004968553165340435, 'samples': 1820352, 'steps': 9480, 'loss/train': 1.7705086469650269}} +11/06/2021 22:34:04 - INFO - __main__ - Step 9489: {'lr': 0.0004968486005167069, 'samples': 1821888, 'steps': 9488, 'loss/train': 1.7480806112289429}} +11/06/2021 22:34:05 - INFO - __main__ - Step 9493: {'lr': 0.0004968452398385984, 'samples': 1822656, 'steps': 9492, 'loss/train': 1.734236240386963}}} +11/06/2021 22:34:07 - INFO - __main__ - Step 9497: {'lr': 0.0004968418773808954, 'samples': 1823424, 'steps': 9496, 'loss/train': 1.705300211906433}}} +11/06/2021 22:34:10 - INFO - __main__ - Step 9502: {'lr': 0.0004968376718062488, 'samples': 1824384, 'steps': 9501, 'loss/train': 1.9032224416732788}} +11/06/2021 22:34:12 - INFO - __main__ - Step 9506: {'lr': 0.0004968343053445469, 'samples': 1825152, 'steps': 9505, 'loss/train': 1.723289132118225}}} +11/06/2021 22:34:14 - INFO - __main__ - Step 9510: {'lr': 0.0004968309371033293, 'samples': 1825920, 'steps': 9509, 'loss/train': 1.9803547859191895}} +11/06/2021 22:34:15 - INFO - __main__ - Step 9514: {'lr': 0.0004968275670826204, 'samples': 1826688, 'steps': 9513, 'loss/train': 1.7052531242370605}} +11/06/2021 22:34:17 - INFO - __main__ - Step 9518: {'lr': 0.0004968241952824442, 'samples': 1827456, 'steps': 9517, 'loss/train': 1.6158838272094727}} +11/06/2021 22:34:20 - INFO - __main__ - Step 9523: {'lr': 0.0004968199780298855, 'samples': 1828416, 'steps': 9522, 'loss/train': 1.8859481811523438}} +11/06/2021 22:34:20 - INFO - __main__ - Step 9523: {'lr': 0.0004968199780298855, 'samples': 1828416, 'steps': 9522, 'loss/train': 1.8859481811523438}} +11/06/2021 22:34:24 - INFO - __main__ - Step 9531: {'lr': 0.0004968132246427212, 'samples': 1829952, 'steps': 9530, 'loss/train': 2.275637149810791}}} +11/06/2021 22:34:26 - INFO - __main__ - Step 9535: {'lr': 0.0004968098452800815, 'samples': 1830720, 'steps': 9534, 'loss/train': 1.9174106121063232}} +11/06/2021 22:34:26 - INFO - __main__ - Step 9535: {'lr': 0.0004968098452800815, 'samples': 1830720, 'steps': 9534, 'loss/train': 1.9174106121063232}} +11/06/2021 22:34:30 - INFO - __main__ - Step 9542: {'lr': 0.0004968039271139412, 'samples': 1832064, 'steps': 9541, 'loss/train': 2.009514331817627}}} +11/06/2021 22:34:31 - INFO - __main__ - Step 9546: {'lr': 0.0004968005428581767, 'samples': 1832832, 'steps': 9545, 'loss/train': 2.1240222454071045}} +11/06/2021 22:34:33 - INFO - __main__ - Step 9550: {'lr': 0.0004967971568231402, 'samples': 1833600, 'steps': 9549, 'loss/train': 1.5235668420791626}} +11/06/2021 22:34:36 - INFO - __main__ - Step 9555: {'lr': 0.0004967929217772801, 'samples': 1834560, 'steps': 9554, 'loss/train': 2.0895955562591553}} +11/06/2021 22:34:38 - INFO - __main__ - Step 9559: {'lr': 0.0004967895317389702, 'samples': 1835328, 'steps': 9558, 'loss/train': 1.6342477798461914}} +11/06/2021 22:34:40 - INFO - __main__ - Step 9563: {'lr': 0.0004967861399214674, 'samples': 1836096, 'steps': 9562, 'loss/train': 1.7751929759979248}} +11/06/2021 22:34:41 - INFO - __main__ - Step 9567: {'lr': 0.0004967827463247962, 'samples': 1836864, 'steps': 9566, 'loss/train': 1.7700427770614624}} +11/06/2021 22:34:43 - INFO - __main__ - Step 9571: {'lr': 0.0004967793509489811, 'samples': 1837632, 'steps': 9570, 'loss/train': 2.0516250133514404}} +11/06/2021 22:34:46 - INFO - __main__ - Step 9576: {'lr': 0.0004967751042273282, 'samples': 1838592, 'steps': 9575, 'loss/train': 2.606065273284912}}} +11/06/2021 22:34:48 - INFO - __main__ - Step 9580: {'lr': 0.0004967717048485287, 'samples': 1839360, 'steps': 9579, 'loss/train': 2.031545400619507}}} +11/06/2021 22:34:50 - INFO - __main__ - Step 9584: {'lr': 0.0004967683036906648, 'samples': 1840128, 'steps': 9583, 'loss/train': 2.204907178878784}}} +11/06/2021 22:34:51 - INFO - __main__ - Step 9588: {'lr': 0.0004967649007537611, 'samples': 1840896, 'steps': 9587, 'loss/train': 1.3074101209640503}} +11/06/2021 22:34:53 - INFO - __main__ - Step 9592: {'lr': 0.0004967614960378421, 'samples': 1841664, 'steps': 9591, 'loss/train': 2.0305135250091553}} +11/06/2021 22:34:56 - INFO - __main__ - Step 9597: {'lr': 0.0004967572376412405, 'samples': 1842624, 'steps': 9596, 'loss/train': 1.8701852560043335}} +11/06/2021 22:34:56 - INFO - __main__ - Step 9597: {'lr': 0.0004967572376412405, 'samples': 1842624, 'steps': 9596, 'loss/train': 1.8701852560043335}} +11/06/2021 22:34:59 - INFO - __main__ - Step 9604: {'lr': 0.0004967512712162387, 'samples': 1843968, 'steps': 9603, 'loss/train': 1.7263696193695068}} +11/06/2021 22:35:02 - INFO - __main__ - Step 9609: {'lr': 0.0004967470061486175, 'samples': 1844928, 'steps': 9608, 'loss/train': 1.621782660484314}}} +11/06/2021 22:35:04 - INFO - __main__ - Step 9613: {'lr': 0.0004967435920932711, 'samples': 1845696, 'steps': 9612, 'loss/train': 1.8796131610870361}} +11/06/2021 22:35:06 - INFO - __main__ - Step 9617: {'lr': 0.0004967401762590631, 'samples': 1846464, 'steps': 9616, 'loss/train': 1.674919605255127}}} +11/06/2021 22:35:06 - INFO - __main__ - Step 9617: {'lr': 0.0004967401762590631, 'samples': 1846464, 'steps': 9616, 'loss/train': 1.674919605255127}}} +11/06/2021 22:35:09 - INFO - __main__ - Step 9624: {'lr': 0.0004967341942688872, 'samples': 1847808, 'steps': 9623, 'loss/train': 1.75148344039917}}}} +11/06/2021 22:35:12 - INFO - __main__ - Step 9629: {'lr': 0.0004967299180835153, 'samples': 1848768, 'steps': 9628, 'loss/train': 1.4124494791030884}} +11/06/2021 22:35:14 - INFO - __main__ - Step 9634: {'lr': 0.0004967256391188258, 'samples': 1849728, 'steps': 9633, 'loss/train': 1.9075095653533936}} +11/06/2021 22:35:14 - INFO - __main__ - Step 9634: {'lr': 0.0004967256391188258, 'samples': 1849728, 'steps': 9633, 'loss/train': 1.9075095653533936}} +11/06/2021 22:35:18 - INFO - __main__ - Step 9641: {'lr': 0.0004967196438990995, 'samples': 1851072, 'steps': 9640, 'loss/train': 1.3965966701507568}} +11/06/2021 22:35:20 - INFO - __main__ - Step 9646: {'lr': 0.0004967153582642452, 'samples': 1852032, 'steps': 9645, 'loss/train': 5.934883117675781}}} +11/06/2021 22:35:22 - INFO - __main__ - Step 9650: {'lr': 0.0004967119277553692, 'samples': 1852800, 'steps': 9649, 'loss/train': 1.5039646625518799}} +11/06/2021 22:35:24 - INFO - __main__ - Step 9654: {'lr': 0.0004967084954678597, 'samples': 1853568, 'steps': 9653, 'loss/train': 2.3092923164367676}} +11/06/2021 22:35:26 - INFO - __main__ - Step 9658: {'lr': 0.0004967050614017415, 'samples': 1854336, 'steps': 9657, 'loss/train': 2.276421546936035}}} +11/06/2021 22:35:28 - INFO - __main__ - Step 9662: {'lr': 0.0004967016255570394, 'samples': 1855104, 'steps': 9661, 'loss/train': 1.8968331813812256}} +11/06/2021 22:35:30 - INFO - __main__ - Step 9667: {'lr': 0.0004966973282500661, 'samples': 1856064, 'steps': 9666, 'loss/train': 1.8805911540985107}} +11/06/2021 22:35:32 - INFO - __main__ - Step 9671: {'lr': 0.0004966938884036408, 'samples': 1856832, 'steps': 9670, 'loss/train': 1.8533520698547363}} +11/06/2021 22:35:35 - INFO - __main__ - Step 9675: {'lr': 0.0004966904467787123, 'samples': 1857600, 'steps': 9674, 'loss/train': 1.5391348600387573}} +11/06/2021 22:35:35 - INFO - __main__ - Step 9675: {'lr': 0.0004966904467787123, 'samples': 1857600, 'steps': 9674, 'loss/train': 1.5391348600387573}} +11/06/2021 22:35:38 - INFO - __main__ - Step 9682: {'lr': 0.0004966844196556382, 'samples': 1858944, 'steps': 9681, 'loss/train': 1.113672137260437}}} +11/06/2021 22:35:40 - INFO - __main__ - Step 9687: {'lr': 0.0004966801112331545, 'samples': 1859904, 'steps': 9686, 'loss/train': 1.8079742193222046}} +11/06/2021 22:35:42 - INFO - __main__ - Step 9691: {'lr': 0.0004966766624944607, 'samples': 1860672, 'steps': 9690, 'loss/train': 1.839411735534668}}} +11/06/2021 22:35:44 - INFO - __main__ - Step 9695: {'lr': 0.0004966732119773879, 'samples': 1861440, 'steps': 9694, 'loss/train': 1.997467279434204}}} +11/06/2021 22:35:46 - INFO - __main__ - Step 9699: {'lr': 0.0004966697596819607, 'samples': 1862208, 'steps': 9698, 'loss/train': 1.9859890937805176}} +11/06/2021 22:35:48 - INFO - __main__ - Step 9703: {'lr': 0.0004966663056082041, 'samples': 1862976, 'steps': 9702, 'loss/train': 2.0231058597564697}} +11/06/2021 22:35:50 - INFO - __main__ - Step 9708: {'lr': 0.0004966619855152706, 'samples': 1863936, 'steps': 9707, 'loss/train': 1.6858545541763306}} +11/06/2021 22:35:53 - INFO - __main__ - Step 9713: {'lr': 0.000496657662643785, 'samples': 1864896, 'steps': 9712, 'loss/train': 1.2711286544799805}}} +11/06/2021 22:35:53 - INFO - __main__ - Step 9713: {'lr': 0.000496657662643785, 'samples': 1864896, 'steps': 9712, 'loss/train': 1.2711286544799805}}} +11/06/2021 22:35:56 - INFO - __main__ - Step 9720: {'lr': 0.0004966516059558304, 'samples': 1866240, 'steps': 9719, 'loss/train': 1.9591999053955078}} +11/06/2021 22:35:58 - INFO - __main__ - Step 9724: {'lr': 0.0004966481425462533, 'samples': 1867008, 'steps': 9723, 'loss/train': 2.0228872299194336}} +11/06/2021 22:36:01 - INFO - __main__ - Step 9730: {'lr': 0.00049664294409782, 'samples': 1868160, 'steps': 9729, 'loss/train': 1.442859172821045}36}} +11/06/2021 22:36:01 - INFO - __main__ - Step 9730: {'lr': 0.00049664294409782, 'samples': 1868160, 'steps': 9729, 'loss/train': 1.442859172821045}36}} +11/06/2021 22:36:05 - INFO - __main__ - Step 9737: {'lr': 0.0004966368741847461, 'samples': 1869504, 'steps': 9736, 'loss/train': 1.5357730388641357}} +11/06/2021 22:36:06 - INFO - __main__ - Step 9741: {'lr': 0.000496633403218104, 'samples': 1870272, 'steps': 9740, 'loss/train': 1.855295181274414}7}} +11/06/2021 22:36:08 - INFO - __main__ - Step 9745: {'lr': 0.0004966299304733947, 'samples': 1871040, 'steps': 9744, 'loss/train': 1.8761732578277588}} +11/06/2021 22:36:10 - INFO - __main__ - Step 9750: {'lr': 0.000496625587042139, 'samples': 1872000, 'steps': 9749, 'loss/train': 1.5603324174880981}}} +11/06/2021 22:36:13 - INFO - __main__ - Step 9755: {'lr': 0.0004966212408327412, 'samples': 1872960, 'steps': 9754, 'loss/train': 1.7627856731414795}} +11/06/2021 22:36:13 - INFO - __main__ - Step 9755: {'lr': 0.0004966212408327412, 'samples': 1872960, 'steps': 9754, 'loss/train': 1.7627856731414795}} +11/06/2021 22:36:16 - INFO - __main__ - Step 9761: {'lr': 0.0004966160217143852, 'samples': 1874112, 'steps': 9760, 'loss/train': 1.4507635831832886}} +11/06/2021 22:36:18 - INFO - __main__ - Step 9766: {'lr': 0.0004966116693932472, 'samples': 1875072, 'steps': 9765, 'loss/train': 2.1143555641174316}} +11/06/2021 22:36:18 - INFO - __main__ - Step 9766: {'lr': 0.0004966116693932472, 'samples': 1875072, 'steps': 9765, 'loss/train': 2.1143555641174316}} +11/06/2021 22:36:22 - INFO - __main__ - Step 9774: {'lr': 0.0004966046999012373, 'samples': 1876608, 'steps': 9773, 'loss/train': 1.0785945653915405}} +11/06/2021 22:36:24 - INFO - __main__ - Step 9778: {'lr': 0.0004966012124884292, 'samples': 1877376, 'steps': 9777, 'loss/train': 1.7784291505813599}} +11/06/2021 22:36:26 - INFO - __main__ - Step 9782: {'lr': 0.0004965977232977861, 'samples': 1878144, 'steps': 9781, 'loss/train': 1.0429720878601074}} +11/06/2021 22:36:28 - INFO - __main__ - Step 9787: {'lr': 0.0004965933593094395, 'samples': 1879104, 'steps': 9786, 'loss/train': 1.8389208316802979}} +11/06/2021 22:36:30 - INFO - __main__ - Step 9792: {'lr': 0.000496588992543314, 'samples': 1880064, 'steps': 9791, 'loss/train': 1.8304022550582886}}} +11/06/2021 22:36:30 - INFO - __main__ - Step 9792: {'lr': 0.000496588992543314, 'samples': 1880064, 'steps': 9791, 'loss/train': 1.8304022550582886}}} +11/06/2021 22:36:35 - INFO - __main__ - Step 9799: {'lr': 0.000496582874404163, 'samples': 1881408, 'steps': 9798, 'loss/train': 0.2936389148235321}}} +11/06/2021 22:36:36 - INFO - __main__ - Step 9803: {'lr': 0.0004965793758802978, 'samples': 1882176, 'steps': 9802, 'loss/train': 1.732246994972229}}} +11/06/2021 22:36:38 - INFO - __main__ - Step 9807: {'lr': 0.000496575875578755, 'samples': 1882944, 'steps': 9806, 'loss/train': 2.212789535522461}}}} +11/06/2021 22:36:40 - INFO - __main__ - Step 9812: {'lr': 0.0004965714977020053, 'samples': 1883904, 'steps': 9811, 'loss/train': 1.6284079551696777}} +11/06/2021 22:36:42 - INFO - __main__ - Step 9816: {'lr': 0.0004965679934007797, 'samples': 1884672, 'steps': 9815, 'loss/train': 1.7675822973251343}} +11/06/2021 22:36:45 - INFO - __main__ - Step 9820: {'lr': 0.0004965644873219583, 'samples': 1885440, 'steps': 9819, 'loss/train': 1.5804340839385986}} +11/06/2021 22:36:46 - INFO - __main__ - Step 9824: {'lr': 0.0004965609794655664, 'samples': 1886208, 'steps': 9823, 'loss/train': 1.8378883600234985}} +11/06/2021 22:36:48 - INFO - __main__ - Step 9828: {'lr': 0.0004965574698316294, 'samples': 1886976, 'steps': 9827, 'loss/train': 1.9440776109695435}} +11/06/2021 22:36:50 - INFO - __main__ - Step 9833: {'lr': 0.0004965530802895738, 'samples': 1887936, 'steps': 9832, 'loss/train': 1.8684687614440918}} +11/06/2021 22:36:50 - INFO - __main__ - Step 9833: {'lr': 0.0004965530802895738, 'samples': 1887936, 'steps': 9832, 'loss/train': 1.8684687614440918}} +11/06/2021 22:36:54 - INFO - __main__ - Step 9840: {'lr': 0.0004965469302648005, 'samples': 1889280, 'steps': 9839, 'loss/train': 2.1997225284576416}} +11/06/2021 22:36:56 - INFO - __main__ - Step 9844: {'lr': 0.000496543413520936, 'samples': 1890048, 'steps': 9843, 'loss/train': 1.9805771112442017}}} +11/06/2021 22:36:59 - INFO - __main__ - Step 9849: {'lr': 0.0004965390150916136, 'samples': 1891008, 'steps': 9848, 'loss/train': 1.9253339767456055}} +11/06/2021 22:37:01 - INFO - __main__ - Step 9853: {'lr': 0.000496535494348593, 'samples': 1891776, 'steps': 9852, 'loss/train': 1.9677116870880127}}} +11/06/2021 22:37:01 - INFO - __main__ - Step 9853: {'lr': 0.000496535494348593, 'samples': 1891776, 'steps': 9852, 'loss/train': 1.9677116870880127}}} +11/06/2021 22:37:04 - INFO - __main__ - Step 9860: {'lr': 0.0004965293287715464, 'samples': 1893120, 'steps': 9859, 'loss/train': 1.8850369453430176}} +11/06/2021 22:37:04 - INFO - __main__ - Step 9860: {'lr': 0.0004965293287715464, 'samples': 1893120, 'steps': 9859, 'loss/train': 1.8850369453430176}} +11/06/2021 22:37:08 - INFO - __main__ - Step 9867: {'lr': 0.0004965231577514666, 'samples': 1894464, 'steps': 9866, 'loss/train': 2.018059253692627}}} +11/06/2021 22:37:11 - INFO - __main__ - Step 9873: {'lr': 0.0004965178639735772, 'samples': 1895616, 'steps': 9872, 'loss/train': 1.981247067451477}}} +11/06/2021 22:37:13 - INFO - __main__ - Step 9877: {'lr': 0.0004965143325667692, 'samples': 1896384, 'steps': 9876, 'loss/train': 2.1641268730163574}} +11/06/2021 22:37:15 - INFO - __main__ - Step 9881: {'lr': 0.0004965107993827524, 'samples': 1897152, 'steps': 9880, 'loss/train': 1.8044612407684326}} +11/06/2021 22:37:17 - INFO - __main__ - Step 9885: {'lr': 0.0004965072644215522, 'samples': 1897920, 'steps': 9884, 'loss/train': 1.9941020011901855}} +11/06/2021 22:37:18 - INFO - __main__ - Step 9889: {'lr': 0.0004965037276831942, 'samples': 1898688, 'steps': 9888, 'loss/train': 1.0114924907684326}} +11/06/2021 22:37:20 - INFO - __main__ - Step 9893: {'lr': 0.0004965001891677037, 'samples': 1899456, 'steps': 9892, 'loss/train': 1.4711591005325317}} +11/06/2021 22:37:20 - INFO - __main__ - Step 9893: {'lr': 0.0004965001891677037, 'samples': 1899456, 'steps': 9892, 'loss/train': 1.4711591005325317}} +11/06/2021 22:37:24 - INFO - __main__ - Step 9900: {'lr': 0.0004964939924894472, 'samples': 1900800, 'steps': 9899, 'loss/train': 1.5659464597702026}} +11/06/2021 22:37:26 - INFO - __main__ - Step 9905: {'lr': 0.0004964895629586928, 'samples': 1901760, 'steps': 9904, 'loss/train': 2.2174274921417236}} +11/06/2021 22:37:29 - INFO - __main__ - Step 9909: {'lr': 0.000496486017334928, 'samples': 1902528, 'steps': 9908, 'loss/train': 2.083883047103882}6}} +11/06/2021 22:37:31 - INFO - __main__ - Step 9913: {'lr': 0.0004964824699341582, 'samples': 1903296, 'steps': 9912, 'loss/train': 1.807940125465393}}} +11/06/2021 22:37:32 - INFO - __main__ - Step 9917: {'lr': 0.0004964789207564094, 'samples': 1904064, 'steps': 9916, 'loss/train': 1.8686342239379883}} +11/06/2021 22:37:34 - INFO - __main__ - Step 9921: {'lr': 0.0004964753698017071, 'samples': 1904832, 'steps': 9920, 'loss/train': 1.6933525800704956}} +11/06/2021 22:37:37 - INFO - __main__ - Step 9926: {'lr': 0.0004964709286095271, 'samples': 1905792, 'steps': 9925, 'loss/train': 1.6846635341644287}} +11/06/2021 22:37:38 - INFO - __main__ - Step 9930: {'lr': 0.0004964673736567728, 'samples': 1906560, 'steps': 9929, 'loss/train': 1.7367271184921265}} +11/06/2021 22:37:38 - INFO - __main__ - Step 9930: {'lr': 0.0004964673736567728, 'samples': 1906560, 'steps': 9929, 'loss/train': 1.7367271184921265}} +11/06/2021 22:37:42 - INFO - __main__ - Step 9937: {'lr': 0.000496461148213874, 'samples': 1907904, 'steps': 9936, 'loss/train': 2.6705877780914307}}} +11/06/2021 22:37:44 - INFO - __main__ - Step 9942: {'lr': 0.0004964566981373905, 'samples': 1908864, 'steps': 9941, 'loss/train': 1.5615383386611938}} +11/06/2021 22:37:47 - INFO - __main__ - Step 9947: {'lr': 0.0004964522452846675, 'samples': 1909824, 'steps': 9946, 'loss/train': 1.8149683475494385}} +11/06/2021 22:37:47 - INFO - __main__ - Step 9947: {'lr': 0.0004964522452846675, 'samples': 1909824, 'steps': 9946, 'loss/train': 1.8149683475494385}} +11/06/2021 22:37:50 - INFO - __main__ - Step 9954: {'lr': 0.0004964460066268681, 'samples': 1911168, 'steps': 9953, 'loss/train': 1.9778108596801758}} +11/06/2021 22:37:52 - INFO - __main__ - Step 9958: {'lr': 0.0004964424392365604, 'samples': 1911936, 'steps': 9957, 'loss/train': 2.3807883262634277}} +11/06/2021 22:37:55 - INFO - __main__ - Step 9963: {'lr': 0.0004964379775002078, 'samples': 1912896, 'steps': 9962, 'loss/train': 2.360861301422119}}} +11/06/2021 22:37:57 - INFO - __main__ - Step 9968: {'lr': 0.0004964335129878264, 'samples': 1913856, 'steps': 9967, 'loss/train': 1.1940803527832031}} +11/06/2021 22:37:57 - INFO - __main__ - Step 9968: {'lr': 0.0004964335129878264, 'samples': 1913856, 'steps': 9967, 'loss/train': 1.1940803527832031}} +11/06/2021 22:38:00 - INFO - __main__ - Step 9975: {'lr': 0.0004964272580068599, 'samples': 1915200, 'steps': 9974, 'loss/train': 1.6218897104263306}} +11/06/2021 22:38:02 - INFO - __main__ - Step 9979: {'lr': 0.000496423681289214, 'samples': 1915968, 'steps': 9978, 'loss/train': 1.7776697874069214}}} +11/06/2021 22:38:05 - INFO - __main__ - Step 9984: {'lr': 0.0004964192078938788, 'samples': 1916928, 'steps': 9983, 'loss/train': 2.1289093494415283}} +11/06/2021 22:38:05 - INFO - __main__ - Step 9984: {'lr': 0.0004964192078938788, 'samples': 1916928, 'steps': 9983, 'loss/train': 2.1289093494415283}} +11/06/2021 22:38:09 - INFO - __main__ - Step 9992: {'lr': 0.0004964120446876633, 'samples': 1918464, 'steps': 9991, 'loss/train': 1.8245000839233398}} +11/06/2021 22:38:11 - INFO - __main__ - Step 9996: {'lr': 0.0004964084604198354, 'samples': 1919232, 'steps': 9995, 'loss/train': 1.9137816429138184}} +11/06/2021 22:38:12 - INFO - __main__ - Step 10000: {'lr': 0.0004964048743755621, 'samples': 1920000, 'steps': 9999, 'loss/train': 1.2586203813552856} +11/06/2021 22:38:15 - INFO - __main__ - Step 10005: {'lr': 0.000496400389322133, 'samples': 1920960, 'steps': 10004, 'loss/train': 1.6377642154693604} +11/06/2021 22:38:17 - INFO - __main__ - Step 10009: {'lr': 0.0004963967992809516, 'samples': 1921728, 'steps': 10008, 'loss/train': 1.7431193590164185} +11/06/2021 22:38:19 - INFO - __main__ - Step 10013: {'lr': 0.0004963932074634087, 'samples': 1922496, 'steps': 10012, 'loss/train': 1.3404390811920166} +11/06/2021 22:38:21 - INFO - __main__ - Step 10017: {'lr': 0.00049638961386953, 'samples': 1923264, 'steps': 10016, 'loss/train': 1.4850966930389404}6} +11/06/2021 22:38:22 - INFO - __main__ - Step 10021: {'lr': 0.0004963860184993416, 'samples': 1924032, 'steps': 10020, 'loss/train': 1.717958688735962}} +11/06/2021 22:38:24 - INFO - __main__ - Step 10025: {'lr': 0.0004963824213528696, 'samples': 1924800, 'steps': 10024, 'loss/train': 1.9384859800338745} +11/06/2021 22:38:27 - INFO - __main__ - Step 10030: {'lr': 0.0004963779224219197, 'samples': 1925760, 'steps': 10029, 'loss/train': 1.7997504472732544} +11/06/2021 22:38:29 - INFO - __main__ - Step 10034: {'lr': 0.0004963743212789038, 'samples': 1926528, 'steps': 10033, 'loss/train': 2.0401864051818848} +11/06/2021 22:38:29 - INFO - __main__ - Step 10034: {'lr': 0.0004963743212789038, 'samples': 1926528, 'steps': 10033, 'loss/train': 2.0401864051818848} +11/06/2021 22:38:32 - INFO - __main__ - Step 10041: {'lr': 0.0004963680150046618, 'samples': 1927872, 'steps': 10040, 'loss/train': 1.8479679822921753} +11/06/2021 22:38:35 - INFO - __main__ - Step 10046: {'lr': 0.0004963635071927633, 'samples': 1928832, 'steps': 10045, 'loss/train': 1.261295199394226}} +11/06/2021 22:38:37 - INFO - __main__ - Step 10051: {'lr': 0.000496358996605675, 'samples': 1929792, 'steps': 10050, 'loss/train': 1.9643739461898804}} +11/06/2021 22:38:39 - INFO - __main__ - Step 10055: {'lr': 0.0004963553861379018, 'samples': 1930560, 'steps': 10054, 'loss/train': 2.023212194442749}} +11/06/2021 22:38:41 - INFO - __main__ - Step 10059: {'lr': 0.0004963517738940656, 'samples': 1931328, 'steps': 10058, 'loss/train': 1.7526215314865112} +11/06/2021 22:38:42 - INFO - __main__ - Step 10063: {'lr': 0.0004963481598741925, 'samples': 1932096, 'steps': 10062, 'loss/train': 1.8724141120910645} +11/06/2021 22:38:45 - INFO - __main__ - Step 10067: {'lr': 0.0004963445440783086, 'samples': 1932864, 'steps': 10066, 'loss/train': 1.8763664960861206} +11/06/2021 22:38:47 - INFO - __main__ - Step 10072: {'lr': 0.0004963400218359781, 'samples': 1933824, 'steps': 10071, 'loss/train': 1.9994356632232666} +11/06/2021 22:38:49 - INFO - __main__ - Step 10076: {'lr': 0.000496336402044165, 'samples': 1934592, 'steps': 10075, 'loss/train': 1.838132619857788}6} +11/06/2021 22:38:51 - INFO - __main__ - Step 10080: {'lr': 0.0004963327804764257, 'samples': 1935360, 'steps': 10079, 'loss/train': 1.9088850021362305} +11/06/2021 22:38:53 - INFO - __main__ - Step 10084: {'lr': 0.0004963291571327866, 'samples': 1936128, 'steps': 10083, 'loss/train': 1.8040343523025513} +11/06/2021 22:38:55 - INFO - __main__ - Step 10088: {'lr': 0.0004963255320132735, 'samples': 1936896, 'steps': 10087, 'loss/train': 2.1118416786193848} +11/06/2021 22:38:57 - INFO - __main__ - Step 10093: {'lr': 0.0004963209981165993, 'samples': 1937856, 'steps': 10092, 'loss/train': 2.122255802154541}} +11/06/2021 22:38:59 - INFO - __main__ - Step 10097: {'lr': 0.0004963173690014656, 'samples': 1938624, 'steps': 10096, 'loss/train': 2.1923022270202637} +11/06/2021 22:39:01 - INFO - __main__ - Step 10101: {'lr': 0.0004963137381105431, 'samples': 1939392, 'steps': 10100, 'loss/train': 2.0459229946136475} +11/06/2021 22:39:01 - INFO - __main__ - Step 10101: {'lr': 0.0004963137381105431, 'samples': 1939392, 'steps': 10100, 'loss/train': 2.0459229946136475} +11/06/2021 22:39:05 - INFO - __main__ - Step 10108: {'lr': 0.0004963073797785153, 'samples': 1940736, 'steps': 10107, 'loss/train': 1.9007415771484375} +11/06/2021 22:39:05 - INFO - __main__ - Step 10108: {'lr': 0.0004963073797785153, 'samples': 1940736, 'steps': 10107, 'loss/train': 1.9007415771484375} +11/06/2021 22:39:08 - INFO - __main__ - Step 10115: {'lr': 0.0004963010160083546, 'samples': 1942080, 'steps': 10114, 'loss/train': 1.9651312828063965} +11/06/2021 22:39:11 - INFO - __main__ - Step 10120: {'lr': 0.0004962964671288484, 'samples': 1943040, 'steps': 10119, 'loss/train': 1.8889999389648438} +11/06/2021 22:39:11 - INFO - __main__ - Step 10120: {'lr': 0.0004962964671288484, 'samples': 1943040, 'steps': 10119, 'loss/train': 1.8889999389648438} +11/06/2021 22:39:15 - INFO - __main__ - Step 10128: {'lr': 0.0004962891831508359, 'samples': 1944576, 'steps': 10127, 'loss/train': 1.920640230178833}} +11/06/2021 22:39:17 - INFO - __main__ - Step 10132: {'lr': 0.000496285538498438, 'samples': 1945344, 'steps': 10131, 'loss/train': 1.649821162223816}}} +11/06/2021 22:39:19 - INFO - __main__ - Step 10136: {'lr': 0.0004962818920704805, 'samples': 1946112, 'steps': 10135, 'loss/train': 2.1492648124694824} +11/06/2021 22:39:21 - INFO - __main__ - Step 10141: {'lr': 0.0004962773315386935, 'samples': 1947072, 'steps': 10140, 'loss/train': 2.360720157623291}} +11/06/2021 22:39:23 - INFO - __main__ - Step 10145: {'lr': 0.0004962736811158236, 'samples': 1947840, 'steps': 10144, 'loss/train': 1.8755285739898682} +11/06/2021 22:39:23 - INFO - __main__ - Step 10145: {'lr': 0.0004962736811158236, 'samples': 1947840, 'steps': 10144, 'loss/train': 1.8755285739898682} +11/06/2021 22:39:27 - INFO - __main__ - Step 10153: {'lr': 0.0004962663749436883, 'samples': 1949376, 'steps': 10152, 'loss/train': 1.250434160232544}} +11/06/2021 22:39:29 - INFO - __main__ - Step 10157: {'lr': 0.0004962627191944756, 'samples': 1950144, 'steps': 10156, 'loss/train': 1.7389650344848633} +11/06/2021 22:39:31 - INFO - __main__ - Step 10162: {'lr': 0.0004962581470113138, 'samples': 1951104, 'steps': 10161, 'loss/train': 1.4758445024490356} +11/06/2021 22:39:31 - INFO - __main__ - Step 10162: {'lr': 0.0004962581470113138, 'samples': 1951104, 'steps': 10161, 'loss/train': 1.4758445024490356} +11/06/2021 22:39:35 - INFO - __main__ - Step 10170: {'lr': 0.00049625082574835, 'samples': 1952640, 'steps': 10169, 'loss/train': 1.8901619911193848}6} +11/06/2021 22:39:35 - INFO - __main__ - Step 10170: {'lr': 0.00049625082574835, 'samples': 1952640, 'steps': 10169, 'loss/train': 1.8901619911193848}6} +11/06/2021 22:39:39 - INFO - __main__ - Step 10177: {'lr': 0.0004962444138180164, 'samples': 1953984, 'steps': 10176, 'loss/train': 1.5094280242919922} +11/06/2021 22:39:41 - INFO - __main__ - Step 10183: {'lr': 0.0004962389135505217, 'samples': 1955136, 'steps': 10182, 'loss/train': 1.9149515628814697} +11/06/2021 22:39:43 - INFO - __main__ - Step 10187: {'lr': 0.0004962352444864904, 'samples': 1955904, 'steps': 10186, 'loss/train': 1.8243874311447144} +11/06/2021 22:39:43 - INFO - __main__ - Step 10187: {'lr': 0.0004962352444864904, 'samples': 1955904, 'steps': 10186, 'loss/train': 1.8243874311447144} +11/06/2021 22:39:47 - INFO - __main__ - Step 10194: {'lr': 0.0004962288193528846, 'samples': 1957248, 'steps': 10193, 'loss/train': 1.8837649822235107} +11/06/2021 22:39:49 - INFO - __main__ - Step 10198: {'lr': 0.0004962251454071259, 'samples': 1958016, 'steps': 10197, 'loss/train': 1.4461283683776855} +11/06/2021 22:39:49 - INFO - __main__ - Step 10198: {'lr': 0.0004962251454071259, 'samples': 1958016, 'steps': 10197, 'loss/train': 1.4461283683776855} +11/06/2021 22:39:53 - INFO - __main__ - Step 10205: {'lr': 0.000496218711730672, 'samples': 1959360, 'steps': 10204, 'loss/train': 1.5240142345428467}} +11/06/2021 22:39:56 - INFO - __main__ - Step 10211: {'lr': 0.0004962131928240972, 'samples': 1960512, 'steps': 10210, 'loss/train': 2.1297640800476074} +11/06/2021 22:39:58 - INFO - __main__ - Step 10215: {'lr': 0.0004962095113342445, 'samples': 1961280, 'steps': 10214, 'loss/train': 1.9678434133529663} +11/06/2021 22:40:00 - INFO - __main__ - Step 10219: {'lr': 0.0004962058280693805, 'samples': 1962048, 'steps': 10218, 'loss/train': 1.1909321546554565} +11/06/2021 22:40:00 - INFO - __main__ - Step 10219: {'lr': 0.0004962058280693805, 'samples': 1962048, 'steps': 10218, 'loss/train': 1.1909321546554565} +11/06/2021 22:40:03 - INFO - __main__ - Step 10226: {'lr': 0.0004961993780848276, 'samples': 1963392, 'steps': 10225, 'loss/train': 1.372536301612854}} +11/06/2021 22:40:05 - INFO - __main__ - Step 10231: {'lr': 0.0004961947676249864, 'samples': 1964352, 'steps': 10230, 'loss/train': 1.6913650035858154} +11/06/2021 22:40:08 - INFO - __main__ - Step 10236: {'lr': 0.0004961901543918563, 'samples': 1965312, 'steps': 10235, 'loss/train': 1.1824220418930054} +11/06/2021 22:40:10 - INFO - __main__ - Step 10240: {'lr': 0.0004961864618086188, 'samples': 1966080, 'steps': 10239, 'loss/train': 1.8443377017974854} +11/06/2021 22:40:10 - INFO - __main__ - Step 10240: {'lr': 0.0004961864618086188, 'samples': 1966080, 'steps': 10239, 'loss/train': 1.8443377017974854} +11/06/2021 22:40:13 - INFO - __main__ - Step 10247: {'lr': 0.0004961799955172483, 'samples': 1967424, 'steps': 10246, 'loss/train': 1.7437840700149536} +11/06/2021 22:40:15 - INFO - __main__ - Step 10252: {'lr': 0.0004961753734099425, 'samples': 1968384, 'steps': 10251, 'loss/train': 1.3765827417373657} +11/06/2021 22:40:18 - INFO - __main__ - Step 10257: {'lr': 0.0004961707485295659, 'samples': 1969344, 'steps': 10256, 'loss/train': 1.6465765237808228} +11/06/2021 22:40:18 - INFO - __main__ - Step 10257: {'lr': 0.0004961707485295659, 'samples': 1969344, 'steps': 10256, 'loss/train': 1.6465765237808228} +11/06/2021 22:40:21 - INFO - __main__ - Step 10263: {'lr': 0.0004961651950127343, 'samples': 1970496, 'steps': 10262, 'loss/train': 1.9414300918579102} +11/06/2021 22:40:23 - INFO - __main__ - Step 10268: {'lr': 0.0004961605640317858, 'samples': 1971456, 'steps': 10267, 'loss/train': 1.6062275171279907} +11/06/2021 22:40:23 - INFO - __main__ - Step 10268: {'lr': 0.0004961605640317858, 'samples': 1971456, 'steps': 10267, 'loss/train': 1.6062275171279907} +11/06/2021 22:40:23 - INFO - __main__ - Step 10268: {'lr': 0.0004961605640317858, 'samples': 1971456, 'steps': 10267, 'loss/train': 1.6062275171279907} +11/06/2021 22:40:29 - INFO - __main__ - Step 10279: {'lr': 0.0004961503661131515, 'samples': 1973568, 'steps': 10278, 'loss/train': 1.548420786857605}} +11/06/2021 22:40:31 - INFO - __main__ - Step 10283: {'lr': 0.0004961466544517267, 'samples': 1974336, 'steps': 10282, 'loss/train': 2.109795570373535}} +11/06/2021 22:40:31 - INFO - __main__ - Step 10283: {'lr': 0.0004961466544517267, 'samples': 1974336, 'steps': 10282, 'loss/train': 2.109795570373535}} +11/06/2021 22:40:35 - INFO - __main__ - Step 10292: {'lr': 0.0004961382967253335, 'samples': 1976064, 'steps': 10291, 'loss/train': 1.815101981163025}} +11/06/2021 22:40:37 - INFO - __main__ - Step 10296: {'lr': 0.0004961345792966926, 'samples': 1976832, 'steps': 10295, 'loss/train': 2.0797855854034424} +11/06/2021 22:40:39 - INFO - __main__ - Step 10300: {'lr': 0.0004961308600935807, 'samples': 1977600, 'steps': 10299, 'loss/train': 1.8009984493255615} +11/06/2021 22:40:41 - INFO - __main__ - Step 10305: {'lr': 0.0004961262085943815, 'samples': 1978560, 'steps': 10304, 'loss/train': 1.3772211074829102} +11/06/2021 22:40:41 - INFO - __main__ - Step 10305: {'lr': 0.0004961262085943815, 'samples': 1978560, 'steps': 10304, 'loss/train': 1.3772211074829102} +11/06/2021 22:40:45 - INFO - __main__ - Step 10312: {'lr': 0.0004961196918376864, 'samples': 1979904, 'steps': 10311, 'loss/train': 1.361377239227295}} +11/06/2021 22:40:47 - INFO - __main__ - Step 10316: {'lr': 0.0004961159655369582, 'samples': 1980672, 'steps': 10315, 'loss/train': 1.5698388814926147} +11/06/2021 22:40:49 - INFO - __main__ - Step 10320: {'lr': 0.0004961122374618933, 'samples': 1981440, 'steps': 10319, 'loss/train': 1.6604183912277222} +11/06/2021 22:40:51 - INFO - __main__ - Step 10326: {'lr': 0.0004961066420224729, 'samples': 1982592, 'steps': 10325, 'loss/train': 1.309130072593689}} +11/06/2021 22:40:54 - INFO - __main__ - Step 10330: {'lr': 0.0004961029095116833, 'samples': 1983360, 'steps': 10329, 'loss/train': 2.0712430477142334} +11/06/2021 22:40:54 - INFO - __main__ - Step 10330: {'lr': 0.0004961029095116833, 'samples': 1983360, 'steps': 10329, 'loss/train': 2.0712430477142334} +11/06/2021 22:40:57 - INFO - __main__ - Step 10337: {'lr': 0.000496096373348546, 'samples': 1984704, 'steps': 10336, 'loss/train': 1.792807936668396}4} +11/06/2021 22:40:59 - INFO - __main__ - Step 10341: {'lr': 0.0004960926359586535, 'samples': 1985472, 'steps': 10340, 'loss/train': 1.554911732673645}} +11/06/2021 22:41:01 - INFO - __main__ - Step 10346: {'lr': 0.0004960879617263664, 'samples': 1986432, 'steps': 10345, 'loss/train': 1.2233792543411255} +11/06/2021 22:41:01 - INFO - __main__ - Step 10346: {'lr': 0.0004960879617263664, 'samples': 1986432, 'steps': 10345, 'loss/train': 1.2233792543411255} +11/06/2021 22:41:01 - INFO - __main__ - Step 10346: {'lr': 0.0004960879617263664, 'samples': 1986432, 'steps': 10345, 'loss/train': 1.2233792543411255} +11/06/2021 22:41:07 - INFO - __main__ - Step 10357: {'lr': 0.0004960776686576663, 'samples': 1988544, 'steps': 10356, 'loss/train': 1.7053444385528564} +11/06/2021 22:41:09 - INFO - __main__ - Step 10362: {'lr': 0.0004960729855548895, 'samples': 1989504, 'steps': 10361, 'loss/train': 1.650147795677185}} +11/06/2021 22:41:12 - INFO - __main__ - Step 10367: {'lr': 0.0004960682996801956, 'samples': 1990464, 'steps': 10366, 'loss/train': 1.6244982481002808} +11/06/2021 22:41:12 - INFO - __main__ - Step 10367: {'lr': 0.0004960682996801956, 'samples': 1990464, 'steps': 10366, 'loss/train': 1.6244982481002808} +11/06/2021 22:41:15 - INFO - __main__ - Step 10374: {'lr': 0.0004960617347989036, 'samples': 1991808, 'steps': 10373, 'loss/train': 1.9511737823486328} +11/06/2021 22:41:15 - INFO - __main__ - Step 10374: {'lr': 0.0004960617347989036, 'samples': 1991808, 'steps': 10373, 'loss/train': 1.9511737823486328} +11/06/2021 22:41:19 - INFO - __main__ - Step 10380: {'lr': 0.0004960561034337975, 'samples': 1992960, 'steps': 10379, 'loss/train': 2.050475835800171}} +11/06/2021 22:41:21 - INFO - __main__ - Step 10385: {'lr': 0.0004960514075806387, 'samples': 1993920, 'steps': 10384, 'loss/train': 2.118435859680176}} +11/06/2021 22:41:23 - INFO - __main__ - Step 10389: {'lr': 0.0004960476489025037, 'samples': 1994688, 'steps': 10388, 'loss/train': 1.7955809831619263} +11/06/2021 22:41:23 - INFO - __main__ - Step 10389: {'lr': 0.0004960476489025037, 'samples': 1994688, 'steps': 10388, 'loss/train': 1.7955809831619263} +11/06/2021 22:41:27 - INFO - __main__ - Step 10396: {'lr': 0.0004960410669474708, 'samples': 1996032, 'steps': 10395, 'loss/train': 1.8390122652053833} +11/06/2021 22:41:29 - INFO - __main__ - Step 10400: {'lr': 0.0004960373033913289, 'samples': 1996800, 'steps': 10399, 'loss/train': 1.6192007064819336} +11/06/2021 22:41:31 - INFO - __main__ - Step 10405: {'lr': 0.0004960325964517912, 'samples': 1997760, 'steps': 10404, 'loss/train': 1.8894060850143433} +11/06/2021 22:41:31 - INFO - __main__ - Step 10405: {'lr': 0.0004960325964517912, 'samples': 1997760, 'steps': 10404, 'loss/train': 1.8894060850143433} +11/06/2021 22:41:36 - INFO - __main__ - Step 10413: {'lr': 0.0004960250595839111, 'samples': 1999296, 'steps': 10412, 'loss/train': 1.6633156538009644} +11/06/2021 22:41:37 - INFO - __main__ - Step 10417: {'lr': 0.0004960212884894353, 'samples': 2000064, 'steps': 10416, 'loss/train': 1.5149108171463013} +11/06/2021 22:41:39 - INFO - __main__ - Step 10421: {'lr': 0.0004960175156213051, 'samples': 2000832, 'steps': 10420, 'loss/train': 0.9687737226486206} +11/06/2021 22:41:42 - INFO - __main__ - Step 10426: {'lr': 0.0004960127970419822, 'samples': 2001792, 'steps': 10425, 'loss/train': 1.9231642484664917} +11/06/2021 22:41:44 - INFO - __main__ - Step 10430: {'lr': 0.0004960090201832293, 'samples': 2002560, 'steps': 10429, 'loss/train': 1.1784454584121704} +11/06/2021 22:41:46 - INFO - __main__ - Step 10434: {'lr': 0.0004960052415509103, 'samples': 2003328, 'steps': 10433, 'loss/train': 1.7110601663589478} +11/06/2021 22:41:47 - INFO - __main__ - Step 10438: {'lr': 0.0004960014611450527, 'samples': 2004096, 'steps': 10437, 'loss/train': 1.7718604803085327} +11/06/2021 22:41:49 - INFO - __main__ - Step 10442: {'lr': 0.0004959976789656838, 'samples': 2004864, 'steps': 10441, 'loss/train': 1.8617457151412964} +11/06/2021 22:41:52 - INFO - __main__ - Step 10447: {'lr': 0.0004959929487475138, 'samples': 2005824, 'steps': 10446, 'loss/train': 1.3970377445220947} +11/06/2021 22:41:54 - INFO - __main__ - Step 10451: {'lr': 0.0004959891625778438, 'samples': 2006592, 'steps': 10450, 'loss/train': 2.1753814220428467} +11/06/2021 22:41:54 - INFO - __main__ - Step 10451: {'lr': 0.0004959891625778438, 'samples': 2006592, 'steps': 10450, 'loss/train': 2.1753814220428467} +11/06/2021 22:41:58 - INFO - __main__ - Step 10458: {'lr': 0.0004959825325136396, 'samples': 2007936, 'steps': 10457, 'loss/train': 1.9572356939315796} +11/06/2021 22:42:00 - INFO - __main__ - Step 10463: {'lr': 0.000495977793428407, 'samples': 2008896, 'steps': 10462, 'loss/train': 1.9288679361343384}} +11/06/2021 22:42:02 - INFO - __main__ - Step 10467: {'lr': 0.0004959740001652102, 'samples': 2009664, 'steps': 10466, 'loss/train': 1.70595121383667}}} +11/06/2021 22:42:04 - INFO - __main__ - Step 10471: {'lr': 0.0004959702051286999, 'samples': 2010432, 'steps': 10470, 'loss/train': 2.0080511569976807} +11/06/2021 22:42:06 - INFO - __main__ - Step 10475: {'lr': 0.0004959664083189035, 'samples': 2011200, 'steps': 10474, 'loss/train': 1.8766359090805054} +11/06/2021 22:42:08 - INFO - __main__ - Step 10479: {'lr': 0.0004959626097358485, 'samples': 2011968, 'steps': 10478, 'loss/train': 1.7041106224060059} +11/06/2021 22:42:10 - INFO - __main__ - Step 10484: {'lr': 0.0004959578590134262, 'samples': 2012928, 'steps': 10483, 'loss/train': 1.7551143169403076} +11/06/2021 22:42:10 - INFO - __main__ - Step 10484: {'lr': 0.0004959578590134262, 'samples': 2012928, 'steps': 10483, 'loss/train': 1.7551143169403076} +11/06/2021 22:42:14 - INFO - __main__ - Step 10492: {'lr': 0.0004959502520946827, 'samples': 2014464, 'steps': 10491, 'loss/train': 2.1610023975372314} +11/06/2021 22:42:15 - INFO - __main__ - Step 10496: {'lr': 0.0004959464459755839, 'samples': 2015232, 'steps': 10495, 'loss/train': 1.2869349718093872} +11/06/2021 22:42:18 - INFO - __main__ - Step 10500: {'lr': 0.0004959426380833703, 'samples': 2016000, 'steps': 10499, 'loss/train': 1.6832598447799683} +11/06/2021 22:42:20 - INFO - __main__ - Step 10504: {'lr': 0.0004959388284180694, 'samples': 2016768, 'steps': 10503, 'loss/train': 2.1253671646118164} +11/06/2021 22:42:22 - INFO - __main__ - Step 10508: {'lr': 0.0004959350169797085, 'samples': 2017536, 'steps': 10507, 'loss/train': 1.786071538925171}} +11/06/2021 22:42:23 - INFO - __main__ - Step 10512: {'lr': 0.0004959312037683154, 'samples': 2018304, 'steps': 10511, 'loss/train': 1.6077988147735596} +11/06/2021 22:42:25 - INFO - __main__ - Step 10516: {'lr': 0.0004959273887839175, 'samples': 2019072, 'steps': 10515, 'loss/train': 1.4780120849609375} +11/06/2021 22:42:28 - INFO - __main__ - Step 10521: {'lr': 0.0004959226175601736, 'samples': 2020032, 'steps': 10520, 'loss/train': 1.7402362823486328} +11/06/2021 22:42:30 - INFO - __main__ - Step 10526: {'lr': 0.0004959178435662064, 'samples': 2020992, 'steps': 10525, 'loss/train': 3.172778606414795}} +11/06/2021 22:42:30 - INFO - __main__ - Step 10526: {'lr': 0.0004959178435662064, 'samples': 2020992, 'steps': 10525, 'loss/train': 3.172778606414795}} +11/06/2021 22:42:34 - INFO - __main__ - Step 10534: {'lr': 0.0004959101994139284, 'samples': 2022528, 'steps': 10533, 'loss/train': 1.9462462663650513} +11/06/2021 22:42:34 - INFO - __main__ - Step 10534: {'lr': 0.0004959101994139284, 'samples': 2022528, 'steps': 10533, 'loss/train': 1.9462462663650513} +11/06/2021 22:42:38 - INFO - __main__ - Step 10541: {'lr': 0.0004959035049635023, 'samples': 2023872, 'steps': 10540, 'loss/train': 0.9154389500617981} +11/06/2021 22:42:40 - INFO - __main__ - Step 10545: {'lr': 0.0004958996771256422, 'samples': 2024640, 'steps': 10544, 'loss/train': 1.765254259109497}} +11/06/2021 22:42:42 - INFO - __main__ - Step 10549: {'lr': 0.0004958958475150044, 'samples': 2025408, 'steps': 10548, 'loss/train': 1.9864680767059326} +11/06/2021 22:42:44 - INFO - __main__ - Step 10553: {'lr': 0.0004958920161316167, 'samples': 2026176, 'steps': 10552, 'loss/train': 1.855413556098938}} +11/06/2021 22:42:46 - INFO - __main__ - Step 10557: {'lr': 0.0004958881829755066, 'samples': 2026944, 'steps': 10556, 'loss/train': 2.26411771774292}}} +11/06/2021 22:42:46 - INFO - __main__ - Step 10557: {'lr': 0.0004958881829755066, 'samples': 2026944, 'steps': 10556, 'loss/train': 2.26411771774292}}} +11/06/2021 22:42:50 - INFO - __main__ - Step 10565: {'lr': 0.0004958805113452298, 'samples': 2028480, 'steps': 10564, 'loss/train': 1.6105812788009644} +11/06/2021 22:42:51 - INFO - __main__ - Step 10569: {'lr': 0.0004958766728711184, 'samples': 2029248, 'steps': 10568, 'loss/train': 1.380372166633606}} +11/06/2021 22:42:53 - INFO - __main__ - Step 10573: {'lr': 0.0004958728326243954, 'samples': 2030016, 'steps': 10572, 'loss/train': 1.5941991806030273} +11/06/2021 22:42:56 - INFO - __main__ - Step 10578: {'lr': 0.0004958680298232983, 'samples': 2030976, 'steps': 10577, 'loss/train': 1.4245156049728394} +11/06/2021 22:42:56 - INFO - __main__ - Step 10578: {'lr': 0.0004958680298232983, 'samples': 2030976, 'steps': 10577, 'loss/train': 1.4245156049728394} +11/06/2021 22:43:00 - INFO - __main__ - Step 10586: {'lr': 0.00049586033958078, 'samples': 2032512, 'steps': 10585, 'loss/train': 2.0318799018859863}4} +11/06/2021 22:43:01 - INFO - __main__ - Step 10590: {'lr': 0.0004958564918007659, 'samples': 2033280, 'steps': 10589, 'loss/train': 0.6293484568595886} +11/06/2021 22:43:04 - INFO - __main__ - Step 10594: {'lr': 0.0004958526422482857, 'samples': 2034048, 'steps': 10593, 'loss/train': 1.8704800605773926} +11/06/2021 22:43:06 - INFO - __main__ - Step 10599: {'lr': 0.0004958478278151969, 'samples': 2035008, 'steps': 10598, 'loss/train': 1.3910499811172485} +11/06/2021 22:43:08 - INFO - __main__ - Step 10603: {'lr': 0.000495843974274769, 'samples': 2035776, 'steps': 10602, 'loss/train': 1.4589587450027466}} +11/06/2021 22:43:08 - INFO - __main__ - Step 10603: {'lr': 0.000495843974274769, 'samples': 2035776, 'steps': 10602, 'loss/train': 1.4589587450027466}} +11/06/2021 22:43:11 - INFO - __main__ - Step 10610: {'lr': 0.0004958372263142571, 'samples': 2037120, 'steps': 10609, 'loss/train': 1.8919156789779663} +11/06/2021 22:43:11 - INFO - __main__ - Step 10610: {'lr': 0.0004958372263142571, 'samples': 2037120, 'steps': 10609, 'loss/train': 1.8919156789779663} +11/06/2021 22:43:15 - INFO - __main__ - Step 10616: {'lr': 0.0004958314380280504, 'samples': 2038272, 'steps': 10615, 'loss/train': 1.4865412712097168} +11/06/2021 22:43:18 - INFO - __main__ - Step 10622: {'lr': 0.0004958256457542011, 'samples': 2039424, 'steps': 10621, 'loss/train': 1.7138190269470215} +11/06/2021 22:43:18 - INFO - __main__ - Step 10622: {'lr': 0.0004958256457542011, 'samples': 2039424, 'steps': 10621, 'loss/train': 1.7138190269470215} +11/06/2021 22:43:22 - INFO - __main__ - Step 10629: {'lr': 0.0004958188830615649, 'samples': 2040768, 'steps': 10628, 'loss/train': 2.004051446914673}} +11/06/2021 22:43:24 - INFO - __main__ - Step 10634: {'lr': 0.0004958140492439502, 'samples': 2041728, 'steps': 10633, 'loss/train': 1.8917224407196045} +11/06/2021 22:43:26 - INFO - __main__ - Step 10639: {'lr': 0.0004958092126573352, 'samples': 2042688, 'steps': 10638, 'loss/train': 1.832000970840454}} +11/06/2021 22:43:26 - INFO - __main__ - Step 10639: {'lr': 0.0004958092126573352, 'samples': 2042688, 'steps': 10638, 'loss/train': 1.832000970840454}} +11/06/2021 22:43:30 - INFO - __main__ - Step 10646: {'lr': 0.0004958024367842569, 'samples': 2044032, 'steps': 10645, 'loss/train': 1.8402926921844482} +11/06/2021 22:43:32 - INFO - __main__ - Step 10650: {'lr': 0.0004957985624201688, 'samples': 2044800, 'steps': 10649, 'loss/train': 1.3269506692886353} +11/06/2021 22:43:34 - INFO - __main__ - Step 10655: {'lr': 0.0004957937169731186, 'samples': 2045760, 'steps': 10654, 'loss/train': 1.672598958015442}} +11/06/2021 22:43:36 - INFO - __main__ - Step 10659: {'lr': 0.0004957898386219603, 'samples': 2046528, 'steps': 10658, 'loss/train': 1.6076505184173584} +11/06/2021 22:43:36 - INFO - __main__ - Step 10659: {'lr': 0.0004957898386219603, 'samples': 2046528, 'steps': 10658, 'loss/train': 1.6076505184173584} +11/06/2021 22:43:40 - INFO - __main__ - Step 10666: {'lr': 0.0004957830472436097, 'samples': 2047872, 'steps': 10665, 'loss/train': 2.27144718170166}4} +11/06/2021 22:43:42 - INFO - __main__ - Step 10671: {'lr': 0.0004957781929366832, 'samples': 2048832, 'steps': 10670, 'loss/train': 2.503723382949829}} +11/06/2021 22:43:42 - INFO - __main__ - Step 10671: {'lr': 0.0004957781929366832, 'samples': 2048832, 'steps': 10670, 'loss/train': 2.503723382949829}} +11/06/2021 22:43:47 - INFO - __main__ - Step 10678: {'lr': 0.0004957713922557563, 'samples': 2050176, 'steps': 10677, 'loss/train': 1.6342339515686035} +11/06/2021 22:43:48 - INFO - __main__ - Step 10682: {'lr': 0.0004957675037160624, 'samples': 2050944, 'steps': 10681, 'loss/train': 1.979127049446106}} +11/06/2021 22:43:50 - INFO - __main__ - Step 10686: {'lr': 0.0004957636134045437, 'samples': 2051712, 'steps': 10685, 'loss/train': 1.5401474237442017} +11/06/2021 22:43:52 - INFO - __main__ - Step 10691: {'lr': 0.0004957587480235595, 'samples': 2052672, 'steps': 10690, 'loss/train': 1.7230714559555054} +11/06/2021 22:43:55 - INFO - __main__ - Step 10695: {'lr': 0.0004957548537255378, 'samples': 2053440, 'steps': 10694, 'loss/train': 2.194444417953491}} +11/06/2021 22:43:57 - INFO - __main__ - Step 10699: {'lr': 0.0004957509576557826, 'samples': 2054208, 'steps': 10698, 'loss/train': 1.7377288341522217} +11/06/2021 22:43:58 - INFO - __main__ - Step 10703: {'lr': 0.0004957470598143218, 'samples': 2054976, 'steps': 10702, 'loss/train': 1.4152930974960327} +11/06/2021 22:44:00 - INFO - __main__ - Step 10707: {'lr': 0.0004957431602011839, 'samples': 2055744, 'steps': 10706, 'loss/train': 1.5255722999572754} +11/06/2021 22:44:03 - INFO - __main__ - Step 10712: {'lr': 0.000495738283193383, 'samples': 2056704, 'steps': 10711, 'loss/train': 1.6758942604064941}} +11/06/2021 22:44:05 - INFO - __main__ - Step 10716: {'lr': 0.0004957343795940738, 'samples': 2057472, 'steps': 10715, 'loss/train': 2.222113847732544}} +11/06/2021 22:44:05 - INFO - __main__ - Step 10716: {'lr': 0.0004957343795940738, 'samples': 2057472, 'steps': 10715, 'loss/train': 2.222113847732544}} +11/06/2021 22:44:08 - INFO - __main__ - Step 10723: {'lr': 0.0004957275440324211, 'samples': 2058816, 'steps': 10722, 'loss/train': 1.7179454565048218} +11/06/2021 22:44:10 - INFO - __main__ - Step 10727: {'lr': 0.0004957236355613184, 'samples': 2059584, 'steps': 10726, 'loss/train': 1.7511495351791382} +11/06/2021 22:44:10 - INFO - __main__ - Step 10727: {'lr': 0.0004957236355613184, 'samples': 2059584, 'steps': 10726, 'loss/train': 1.7511495351791382} +11/06/2021 22:44:15 - INFO - __main__ - Step 10736: {'lr': 0.0004957148350243025, 'samples': 2061312, 'steps': 10735, 'loss/train': 2.2027082443237305} +11/06/2021 22:44:15 - INFO - __main__ - Step 10736: {'lr': 0.0004957148350243025, 'samples': 2061312, 'steps': 10735, 'loss/train': 2.2027082443237305} +11/06/2021 22:44:18 - INFO - __main__ - Step 10743: {'lr': 0.0004957079839621051, 'samples': 2062656, 'steps': 10742, 'loss/train': 2.051661968231201}} +11/06/2021 22:44:20 - INFO - __main__ - Step 10748: {'lr': 0.0004957030870248742, 'samples': 2063616, 'steps': 10747, 'loss/train': 1.2029649019241333} +11/06/2021 22:44:20 - INFO - __main__ - Step 10748: {'lr': 0.0004957030870248742, 'samples': 2063616, 'steps': 10747, 'loss/train': 1.2029649019241333} +11/06/2021 22:44:24 - INFO - __main__ - Step 10756: {'lr': 0.0004956952461684066, 'samples': 2065152, 'steps': 10755, 'loss/train': 2.1202139854431152} +11/06/2021 22:44:26 - INFO - __main__ - Step 10760: {'lr': 0.0004956913230832031, 'samples': 2065920, 'steps': 10759, 'loss/train': 2.134770154953003}} +11/06/2021 22:44:28 - INFO - __main__ - Step 10764: {'lr': 0.000495687398226724, 'samples': 2066688, 'steps': 10763, 'loss/train': 1.661841869354248}}} +11/06/2021 22:44:31 - INFO - __main__ - Step 10768: {'lr': 0.0004956834715989977, 'samples': 2067456, 'steps': 10767, 'loss/train': 1.8057781457901}}}} +11/06/2021 22:44:32 - INFO - __main__ - Step 10772: {'lr': 0.0004956795432000526, 'samples': 2068224, 'steps': 10771, 'loss/train': 1.9097800254821777} +11/06/2021 22:44:34 - INFO - __main__ - Step 10776: {'lr': 0.0004956756130299169, 'samples': 2068992, 'steps': 10775, 'loss/train': 1.20347261428833}7} +11/06/2021 22:44:36 - INFO - __main__ - Step 10781: {'lr': 0.0004956706978265536, 'samples': 2069952, 'steps': 10780, 'loss/train': 1.7361626625061035} +11/06/2021 22:44:38 - INFO - __main__ - Step 10785: {'lr': 0.0004956667636713427, 'samples': 2070720, 'steps': 10784, 'loss/train': 1.5868165493011475} +11/06/2021 22:44:40 - INFO - __main__ - Step 10789: {'lr': 0.0004956628277450333, 'samples': 2071488, 'steps': 10788, 'loss/train': 2.1454813480377197} +11/06/2021 22:44:43 - INFO - __main__ - Step 10793: {'lr': 0.0004956588900476538, 'samples': 2072256, 'steps': 10792, 'loss/train': 1.459761381149292}} +11/06/2021 22:44:44 - INFO - __main__ - Step 10797: {'lr': 0.0004956549505792327, 'samples': 2073024, 'steps': 10796, 'loss/train': 2.264521360397339}} +11/06/2021 22:44:46 - INFO - __main__ - Step 10801: {'lr': 0.0004956510093397983, 'samples': 2073792, 'steps': 10800, 'loss/train': 1.6848071813583374} +11/06/2021 22:44:46 - INFO - __main__ - Step 10801: {'lr': 0.0004956510093397983, 'samples': 2073792, 'steps': 10800, 'loss/train': 1.6848071813583374} +11/06/2021 22:44:51 - INFO - __main__ - Step 10810: {'lr': 0.0004956421350759508, 'samples': 2075520, 'steps': 10809, 'loss/train': 1.3117084503173828} +11/06/2021 22:44:53 - INFO - __main__ - Step 10814: {'lr': 0.0004956381880809195, 'samples': 2076288, 'steps': 10813, 'loss/train': 2.0894155502319336} +11/06/2021 22:44:54 - INFO - __main__ - Step 10818: {'lr': 0.0004956342393149959, 'samples': 2077056, 'steps': 10817, 'loss/train': 1.7274878025054932} +11/06/2021 22:44:57 - INFO - __main__ - Step 10822: {'lr': 0.0004956302887782082, 'samples': 2077824, 'steps': 10821, 'loss/train': 1.0446696281433105} +11/06/2021 22:44:59 - INFO - __main__ - Step 10826: {'lr': 0.0004956263364705851, 'samples': 2078592, 'steps': 10825, 'loss/train': 1.6332308053970337} +11/06/2021 22:45:01 - INFO - __main__ - Step 10830: {'lr': 0.000495622382392155, 'samples': 2079360, 'steps': 10829, 'loss/train': 1.06633460521698}37} +11/06/2021 22:45:02 - INFO - __main__ - Step 10834: {'lr': 0.0004956184265429463, 'samples': 2080128, 'steps': 10833, 'loss/train': 2.010787010192871}} +11/06/2021 22:45:04 - INFO - __main__ - Step 10838: {'lr': 0.0004956144689229877, 'samples': 2080896, 'steps': 10837, 'loss/train': 2.1746902465820312} +11/06/2021 22:45:07 - INFO - __main__ - Step 10843: {'lr': 0.0004956095194079658, 'samples': 2081856, 'steps': 10842, 'loss/train': 1.8103166818618774} +11/06/2021 22:45:09 - INFO - __main__ - Step 10847: {'lr': 0.0004956055578039241, 'samples': 2082624, 'steps': 10846, 'loss/train': 1.727042317390442}} +11/06/2021 22:45:11 - INFO - __main__ - Step 10851: {'lr': 0.0004956015944292253, 'samples': 2083392, 'steps': 10850, 'loss/train': 2.1259398460388184} +11/06/2021 22:45:12 - INFO - __main__ - Step 10855: {'lr': 0.0004955976292838979, 'samples': 2084160, 'steps': 10854, 'loss/train': 1.4349844455718994} +11/06/2021 22:45:15 - INFO - __main__ - Step 10859: {'lr': 0.0004955936623679703, 'samples': 2084928, 'steps': 10858, 'loss/train': 2.2991316318511963} +11/06/2021 22:45:17 - INFO - __main__ - Step 10864: {'lr': 0.0004955887012331982, 'samples': 2085888, 'steps': 10863, 'loss/train': 1.7115322351455688} +11/06/2021 22:45:17 - INFO - __main__ - Step 10864: {'lr': 0.0004955887012331982, 'samples': 2085888, 'steps': 10863, 'loss/train': 1.7115322351455688} +11/06/2021 22:45:20 - INFO - __main__ - Step 10871: {'lr': 0.0004955817509968737, 'samples': 2087232, 'steps': 10870, 'loss/train': 1.3590363264083862} +11/06/2021 22:45:22 - INFO - __main__ - Step 10875: {'lr': 0.0004955777769988322, 'samples': 2088000, 'steps': 10874, 'loss/train': 2.0556890964508057} +11/06/2021 22:45:25 - INFO - __main__ - Step 10880: {'lr': 0.0004955728070115787, 'samples': 2088960, 'steps': 10879, 'loss/train': 1.9695255756378174} +11/06/2021 22:45:25 - INFO - __main__ - Step 10880: {'lr': 0.0004955728070115787, 'samples': 2088960, 'steps': 10879, 'loss/train': 1.9695255756378174} +11/06/2021 22:45:28 - INFO - __main__ - Step 10887: {'lr': 0.0004955658443820809, 'samples': 2090304, 'steps': 10886, 'loss/train': 1.9681472778320312} +11/06/2021 22:45:31 - INFO - __main__ - Step 10892: {'lr': 0.0004955608677558424, 'samples': 2091264, 'steps': 10891, 'loss/train': 1.5222508907318115} +11/06/2021 22:45:33 - INFO - __main__ - Step 10897: {'lr': 0.0004955558883634555, 'samples': 2092224, 'steps': 10896, 'loss/train': 2.1378374099731445} +11/06/2021 22:45:35 - INFO - __main__ - Step 10901: {'lr': 0.0004955519028579568, 'samples': 2092992, 'steps': 10900, 'loss/train': 1.904826045036316}} +11/06/2021 22:45:37 - INFO - __main__ - Step 10905: {'lr': 0.0004955479155821877, 'samples': 2093760, 'steps': 10904, 'loss/train': 1.7908188104629517} +11/06/2021 22:45:38 - INFO - __main__ - Step 10909: {'lr': 0.000495543926536177, 'samples': 2094528, 'steps': 10908, 'loss/train': 1.9852023124694824}} +11/06/2021 22:45:40 - INFO - __main__ - Step 10913: {'lr': 0.0004955399357199534, 'samples': 2095296, 'steps': 10912, 'loss/train': 1.5614092350006104} +11/06/2021 22:45:43 - INFO - __main__ - Step 10918: {'lr': 0.0004955349447103559, 'samples': 2096256, 'steps': 10917, 'loss/train': 1.4804587364196777} +11/06/2021 22:45:45 - INFO - __main__ - Step 10922: {'lr': 0.0004955309499112586, 'samples': 2097024, 'steps': 10921, 'loss/train': 1.534606695175171}} +11/06/2021 22:45:47 - INFO - __main__ - Step 10926: {'lr': 0.0004955269533420419, 'samples': 2097792, 'steps': 10925, 'loss/train': 1.5095373392105103} +11/06/2021 22:45:49 - INFO - __main__ - Step 10930: {'lr': 0.0004955229550027347, 'samples': 2098560, 'steps': 10929, 'loss/train': 1.7207810878753662} +11/06/2021 22:45:51 - INFO - __main__ - Step 10934: {'lr': 0.000495518954893366, 'samples': 2099328, 'steps': 10933, 'loss/train': 1.7026230096817017}} +11/06/2021 22:45:53 - INFO - __main__ - Step 10939: {'lr': 0.0004955139522675496, 'samples': 2100288, 'steps': 10938, 'loss/train': 2.6687307357788086} +11/06/2021 22:45:55 - INFO - __main__ - Step 10943: {'lr': 0.0004955099481756475, 'samples': 2101056, 'steps': 10942, 'loss/train': 2.186129331588745}} +11/06/2021 22:45:57 - INFO - __main__ - Step 10947: {'lr': 0.0004955059423137774, 'samples': 2101824, 'steps': 10946, 'loss/train': 1.8952678442001343} +11/06/2021 22:45:59 - INFO - __main__ - Step 10951: {'lr': 0.0004955019346819684, 'samples': 2102592, 'steps': 10950, 'loss/train': 1.7060812711715698} +11/06/2021 22:46:01 - INFO - __main__ - Step 10955: {'lr': 0.0004954979252802491, 'samples': 2103360, 'steps': 10954, 'loss/train': 1.854745626449585}} +11/06/2021 22:46:03 - INFO - __main__ - Step 10959: {'lr': 0.0004954939141086488, 'samples': 2104128, 'steps': 10958, 'loss/train': 1.2875730991363525} +11/06/2021 22:46:03 - INFO - __main__ - Step 10959: {'lr': 0.0004954939141086488, 'samples': 2104128, 'steps': 10958, 'loss/train': 1.2875730991363525} +11/06/2021 22:46:07 - INFO - __main__ - Step 10967: {'lr': 0.0004954858864559199, 'samples': 2105664, 'steps': 10966, 'loss/train': 2.002821922302246}} +11/06/2021 22:46:09 - INFO - __main__ - Step 10971: {'lr': 0.0004954818699748493, 'samples': 2106432, 'steps': 10970, 'loss/train': 1.9312834739685059} +11/06/2021 22:46:10 - INFO - __main__ - Step 10975: {'lr': 0.0004954778517240133, 'samples': 2107200, 'steps': 10974, 'loss/train': 1.7459683418273926} +11/06/2021 22:46:13 - INFO - __main__ - Step 10980: {'lr': 0.0004954728264217796, 'samples': 2108160, 'steps': 10979, 'loss/train': 1.738264560699463}} +11/06/2021 22:46:15 - INFO - __main__ - Step 10985: {'lr': 0.0004954677983543893, 'samples': 2109120, 'steps': 10984, 'loss/train': 1.65086829662323}}} +11/06/2021 22:46:17 - INFO - __main__ - Step 10989: {'lr': 0.0004954637739096023, 'samples': 2109888, 'steps': 10988, 'loss/train': 2.1266255378723145} +11/06/2021 22:46:17 - INFO - __main__ - Step 10989: {'lr': 0.0004954637739096023, 'samples': 2109888, 'steps': 10988, 'loss/train': 2.1266255378723145} +11/06/2021 22:46:21 - INFO - __main__ - Step 10996: {'lr': 0.0004954567268730582, 'samples': 2111232, 'steps': 10995, 'loss/train': 1.7507246732711792} +11/06/2021 22:46:23 - INFO - __main__ - Step 11000: {'lr': 0.0004954526975618447, 'samples': 2112000, 'steps': 10999, 'loss/train': 1.7559417486190796} +11/06/2021 22:46:25 - INFO - __main__ - Step 11004: {'lr': 0.0004954486664810762, 'samples': 2112768, 'steps': 11003, 'loss/train': 1.973361849784851}} +11/06/2021 22:46:27 - INFO - __main__ - Step 11008: {'lr': 0.0004954446336307814, 'samples': 2113536, 'steps': 11007, 'loss/train': 1.5346612930297852} +11/06/2021 22:46:29 - INFO - __main__ - Step 11012: {'lr': 0.0004954405990109897, 'samples': 2114304, 'steps': 11011, 'loss/train': 1.1053050756454468} +11/06/2021 22:46:31 - INFO - __main__ - Step 11016: {'lr': 0.0004954365626217299, 'samples': 2115072, 'steps': 11015, 'loss/train': 1.8625273704528809} +11/06/2021 22:46:31 - INFO - __main__ - Step 11016: {'lr': 0.0004954365626217299, 'samples': 2115072, 'steps': 11015, 'loss/train': 1.8625273704528809} +11/06/2021 22:46:34 - INFO - __main__ - Step 11023: {'lr': 0.0004954294946828308, 'samples': 2116416, 'steps': 11022, 'loss/train': 2.187809944152832}} +11/06/2021 22:46:37 - INFO - __main__ - Step 11029: {'lr': 0.0004954234321365998, 'samples': 2117568, 'steps': 11028, 'loss/train': 2.104278087615967}} +11/06/2021 22:46:39 - INFO - __main__ - Step 11033: {'lr': 0.0004954193882274261, 'samples': 2118336, 'steps': 11032, 'loss/train': 1.8850313425064087} +11/06/2021 22:46:41 - INFO - __main__ - Step 11037: {'lr': 0.0004954153425489374, 'samples': 2119104, 'steps': 11036, 'loss/train': 1.7933595180511475} +11/06/2021 22:46:43 - INFO - __main__ - Step 11041: {'lr': 0.0004954112951011628, 'samples': 2119872, 'steps': 11040, 'loss/train': 1.5636467933654785} +11/06/2021 22:46:45 - INFO - __main__ - Step 11045: {'lr': 0.0004954072458841315, 'samples': 2120640, 'steps': 11044, 'loss/train': 1.7006868124008179} +11/06/2021 22:46:47 - INFO - __main__ - Step 11049: {'lr': 0.0004954031948978729, 'samples': 2121408, 'steps': 11048, 'loss/train': 1.3999689817428589} +11/06/2021 22:46:49 - INFO - __main__ - Step 11054: {'lr': 0.0004953981286771178, 'samples': 2122368, 'steps': 11053, 'loss/train': 0.8524397015571594} +11/06/2021 22:46:49 - INFO - __main__ - Step 11054: {'lr': 0.0004953981286771178, 'samples': 2122368, 'steps': 11053, 'loss/train': 0.8524397015571594} +11/06/2021 22:46:52 - INFO - __main__ - Step 11060: {'lr': 0.0004953920455633206, 'samples': 2123520, 'steps': 11059, 'loss/train': 1.7199558019638062} +11/06/2021 22:46:54 - INFO - __main__ - Step 11064: {'lr': 0.000495387987942719, 'samples': 2124288, 'steps': 11063, 'loss/train': 1.8901044130325317}} +11/06/2021 22:46:57 - INFO - __main__ - Step 11069: {'lr': 0.0004953829134291895, 'samples': 2125248, 'steps': 11068, 'loss/train': 2.0392954349517822} +11/06/2021 22:46:59 - INFO - __main__ - Step 11074: {'lr': 0.0004953778361515163, 'samples': 2126208, 'steps': 11073, 'loss/train': 1.7177420854568481} +11/06/2021 22:47:01 - INFO - __main__ - Step 11078: {'lr': 0.0004953737723392324, 'samples': 2126976, 'steps': 11077, 'loss/train': 2.2842390537261963} +11/06/2021 22:47:03 - INFO - __main__ - Step 11082: {'lr': 0.0004953697067579624, 'samples': 2127744, 'steps': 11081, 'loss/train': 1.5058166980743408} +11/06/2021 22:47:05 - INFO - __main__ - Step 11086: {'lr': 0.0004953656394077355, 'samples': 2128512, 'steps': 11085, 'loss/train': 1.1860450506210327} +11/06/2021 22:47:07 - INFO - __main__ - Step 11090: {'lr': 0.0004953615702885812, 'samples': 2129280, 'steps': 11089, 'loss/train': 1.5646089315414429} +11/06/2021 22:47:09 - INFO - __main__ - Step 11095: {'lr': 0.0004953564814021285, 'samples': 2130240, 'steps': 11094, 'loss/train': 1.9974864721298218} +11/06/2021 22:47:11 - INFO - __main__ - Step 11099: {'lr': 0.0004953524083029945, 'samples': 2131008, 'steps': 11098, 'loss/train': 2.143897533416748}} +11/06/2021 22:47:13 - INFO - __main__ - Step 11103: {'lr': 0.0004953483334350283, 'samples': 2131776, 'steps': 11102, 'loss/train': 1.5690078735351562} +11/06/2021 22:47:15 - INFO - __main__ - Step 11107: {'lr': 0.0004953442567982593, 'samples': 2132544, 'steps': 11106, 'loss/train': 1.606833815574646}} +11/06/2021 22:47:17 - INFO - __main__ - Step 11111: {'lr': 0.0004953401783927171, 'samples': 2133312, 'steps': 11110, 'loss/train': 1.9979164600372314} +11/06/2021 22:47:19 - INFO - __main__ - Step 11116: {'lr': 0.0004953350778984963, 'samples': 2134272, 'steps': 11115, 'loss/train': 1.8427363634109497} +11/06/2021 22:47:21 - INFO - __main__ - Step 11120: {'lr': 0.0004953309955133214, 'samples': 2135040, 'steps': 11119, 'loss/train': 1.8152966499328613} +11/06/2021 22:47:23 - INFO - __main__ - Step 11124: {'lr': 0.0004953269113594687, 'samples': 2135808, 'steps': 11123, 'loss/train': 1.684847116470337}} +11/06/2021 22:47:23 - INFO - __main__ - Step 11124: {'lr': 0.0004953269113594687, 'samples': 2135808, 'steps': 11123, 'loss/train': 1.684847116470337}} +11/06/2021 22:47:26 - INFO - __main__ - Step 11131: {'lr': 0.0004953197598344342, 'samples': 2137152, 'steps': 11130, 'loss/train': 2.116920232772827}} +11/06/2021 22:47:29 - INFO - __main__ - Step 11136: {'lr': 0.0004953146482861385, 'samples': 2138112, 'steps': 11135, 'loss/train': 1.7565672397613525} +11/06/2021 22:47:31 - INFO - __main__ - Step 11141: {'lr': 0.000495309533974468, 'samples': 2139072, 'steps': 11140, 'loss/train': 1.7597218751907349}} +11/06/2021 22:47:33 - INFO - __main__ - Step 11145: {'lr': 0.0004953054405355404, 'samples': 2139840, 'steps': 11144, 'loss/train': 2.103456735610962}} +11/06/2021 22:47:33 - INFO - __main__ - Step 11145: {'lr': 0.0004953054405355404, 'samples': 2139840, 'steps': 11144, 'loss/train': 2.103456735610962}} +11/06/2021 22:47:36 - INFO - __main__ - Step 11152: {'lr': 0.0004952982727619973, 'samples': 2141184, 'steps': 11151, 'loss/train': 1.672674298286438}} +11/06/2021 22:47:39 - INFO - __main__ - Step 11157: {'lr': 0.0004952931496079143, 'samples': 2142144, 'steps': 11156, 'loss/train': 1.9701721668243408} +11/06/2021 22:47:41 - INFO - __main__ - Step 11162: {'lr': 0.0004952880236906988, 'samples': 2143104, 'steps': 11161, 'loss/train': 1.2465680837631226} +11/06/2021 22:47:43 - INFO - __main__ - Step 11166: {'lr': 0.0004952839209675096, 'samples': 2143872, 'steps': 11165, 'loss/train': 1.383769154548645}} +11/06/2021 22:47:45 - INFO - __main__ - Step 11170: {'lr': 0.000495279816475982, 'samples': 2144640, 'steps': 11169, 'loss/train': 1.741720199584961}}} +11/06/2021 22:47:47 - INFO - __main__ - Step 11174: {'lr': 0.0004952757102161457, 'samples': 2145408, 'steps': 11173, 'loss/train': 1.3439342975616455} +11/06/2021 22:47:49 - INFO - __main__ - Step 11178: {'lr': 0.0004952716021880301, 'samples': 2146176, 'steps': 11177, 'loss/train': 2.207341194152832}} +11/06/2021 22:47:49 - INFO - __main__ - Step 11178: {'lr': 0.0004952716021880301, 'samples': 2146176, 'steps': 11177, 'loss/train': 2.207341194152832}} +11/06/2021 22:47:49 - INFO - __main__ - Step 11178: {'lr': 0.0004952716021880301, 'samples': 2146176, 'steps': 11177, 'loss/train': 2.207341194152832}} +11/06/2021 22:47:55 - INFO - __main__ - Step 11189: {'lr': 0.0004952602959932644, 'samples': 2148288, 'steps': 11188, 'loss/train': 0.2998165488243103} +11/06/2021 22:47:57 - INFO - __main__ - Step 11194: {'lr': 0.0004952551523933682, 'samples': 2149248, 'steps': 11193, 'loss/train': 2.243593692779541}} +11/06/2021 22:48:00 - INFO - __main__ - Step 11199: {'lr': 0.0004952500060307674, 'samples': 2150208, 'steps': 11198, 'loss/train': 1.9236924648284912} +11/06/2021 22:48:02 - INFO - __main__ - Step 11203: {'lr': 0.0004952458869515782, 'samples': 2150976, 'steps': 11202, 'loss/train': 1.9771145582199097} +11/06/2021 22:48:02 - INFO - __main__ - Step 11203: {'lr': 0.0004952458869515782, 'samples': 2150976, 'steps': 11202, 'loss/train': 1.9771145582199097} +11/06/2021 22:48:05 - INFO - __main__ - Step 11210: {'lr': 0.0004952386743086107, 'samples': 2152320, 'steps': 11209, 'loss/train': 1.5023480653762817} +11/06/2021 22:48:07 - INFO - __main__ - Step 11215: {'lr': 0.0004952335191057447, 'samples': 2153280, 'steps': 11214, 'loss/train': 1.707075834274292}} +11/06/2021 22:48:10 - INFO - __main__ - Step 11220: {'lr': 0.0004952283611404176, 'samples': 2154240, 'steps': 11219, 'loss/train': 1.5863221883773804} +11/06/2021 22:48:12 - INFO - __main__ - Step 11224: {'lr': 0.000495224232779223, 'samples': 2155008, 'steps': 11223, 'loss/train': 1.7595049142837524}} +11/06/2021 22:48:12 - INFO - __main__ - Step 11224: {'lr': 0.000495224232779223, 'samples': 2155008, 'steps': 11223, 'loss/train': 1.7595049142837524}} +11/06/2021 22:48:15 - INFO - __main__ - Step 11231: {'lr': 0.0004952170038931217, 'samples': 2156352, 'steps': 11230, 'loss/train': 1.376936912536621}} +11/06/2021 22:48:18 - INFO - __main__ - Step 11236: {'lr': 0.0004952118370883101, 'samples': 2157312, 'steps': 11235, 'loss/train': 2.1615216732025146} +11/06/2021 22:48:20 - INFO - __main__ - Step 11240: {'lr': 0.0004952077016556619, 'samples': 2158080, 'steps': 11239, 'loss/train': 1.766661524772644}} +11/06/2021 22:48:22 - INFO - __main__ - Step 11244: {'lr': 0.0004952035644552249, 'samples': 2158848, 'steps': 11243, 'loss/train': 1.4197368621826172} +11/06/2021 22:48:24 - INFO - __main__ - Step 11248: {'lr': 0.0004951994254870286, 'samples': 2159616, 'steps': 11247, 'loss/train': 1.3976362943649292} +11/06/2021 22:48:25 - INFO - __main__ - Step 11252: {'lr': 0.0004951952847511033, 'samples': 2160384, 'steps': 11251, 'loss/train': 1.3120644092559814} +11/06/2021 22:48:25 - INFO - __main__ - Step 11252: {'lr': 0.0004951952847511033, 'samples': 2160384, 'steps': 11251, 'loss/train': 1.3120644092559814} +11/06/2021 22:48:29 - INFO - __main__ - Step 11260: {'lr': 0.0004951869979761842, 'samples': 2161920, 'steps': 11259, 'loss/train': 1.692081332206726}} +11/06/2021 22:48:31 - INFO - __main__ - Step 11264: {'lr': 0.0004951828519372503, 'samples': 2162688, 'steps': 11263, 'loss/train': 1.470284104347229}} +11/06/2021 22:48:33 - INFO - __main__ - Step 11268: {'lr': 0.0004951787041307066, 'samples': 2163456, 'steps': 11267, 'loss/train': 1.7130874395370483} +11/06/2021 22:48:35 - INFO - __main__ - Step 11272: {'lr': 0.0004951745545565831, 'samples': 2164224, 'steps': 11271, 'loss/train': 1.5138862133026123} +11/06/2021 22:48:37 - INFO - __main__ - Step 11277: {'lr': 0.000495169365103315, 'samples': 2165184, 'steps': 11276, 'loss/train': 1.7609519958496094}} +11/06/2021 22:48:39 - INFO - __main__ - Step 11281: {'lr': 0.0004951652115522462, 'samples': 2165952, 'steps': 11280, 'loss/train': 1.7629950046539307} +11/06/2021 22:48:41 - INFO - __main__ - Step 11285: {'lr': 0.0004951610562336949, 'samples': 2166720, 'steps': 11284, 'loss/train': 1.6244908571243286} +11/06/2021 22:48:43 - INFO - __main__ - Step 11289: {'lr': 0.0004951568991476908, 'samples': 2167488, 'steps': 11288, 'loss/train': 1.3978345394134521} +11/06/2021 22:48:45 - INFO - __main__ - Step 11293: {'lr': 0.0004951527402942643, 'samples': 2168256, 'steps': 11292, 'loss/train': 1.4760860204696655} +11/06/2021 22:48:47 - INFO - __main__ - Step 11298: {'lr': 0.0004951475392420884, 'samples': 2169216, 'steps': 11297, 'loss/train': 2.0938913822174072} +11/06/2021 22:48:47 - INFO - __main__ - Step 11298: {'lr': 0.0004951475392420884, 'samples': 2169216, 'steps': 11297, 'loss/train': 2.0938913822174072} +11/06/2021 22:48:51 - INFO - __main__ - Step 11305: {'lr': 0.0004951402531297482, 'samples': 2170560, 'steps': 11304, 'loss/train': 2.0329270362854004} +11/06/2021 22:48:53 - INFO - __main__ - Step 11309: {'lr': 0.0004951360872069309, 'samples': 2171328, 'steps': 11308, 'loss/train': 1.3344480991363525} +11/06/2021 22:48:55 - INFO - __main__ - Step 11314: {'lr': 0.0004951308773181856, 'samples': 2172288, 'steps': 11313, 'loss/train': 2.1913249492645264} +11/06/2021 22:48:58 - INFO - __main__ - Step 11319: {'lr': 0.0004951256646681356, 'samples': 2173248, 'steps': 11318, 'loss/train': 1.662163496017456}} +11/06/2021 22:49:00 - INFO - __main__ - Step 11323: {'lr': 0.0004951214925599957, 'samples': 2174016, 'steps': 11322, 'loss/train': 1.6424283981323242} +11/06/2021 22:49:00 - INFO - __main__ - Step 11323: {'lr': 0.0004951214925599957, 'samples': 2174016, 'steps': 11322, 'loss/train': 1.6424283981323242} +11/06/2021 22:49:03 - INFO - __main__ - Step 11330: {'lr': 0.0004951141871185224, 'samples': 2175360, 'steps': 11329, 'loss/train': 2.280247449874878}} +11/06/2021 22:49:06 - INFO - __main__ - Step 11335: {'lr': 0.0004951089656326919, 'samples': 2176320, 'steps': 11334, 'loss/train': 0.3128710389137268} +11/06/2021 22:49:08 - INFO - __main__ - Step 11339: {'lr': 0.0004951047864560629, 'samples': 2177088, 'steps': 11338, 'loss/train': 1.64912748336792}8} +11/06/2021 22:49:10 - INFO - __main__ - Step 11343: {'lr': 0.000495100605512387, 'samples': 2177856, 'steps': 11342, 'loss/train': 1.8620246648788452}} +11/06/2021 22:49:11 - INFO - __main__ - Step 11347: {'lr': 0.0004950964228016944, 'samples': 2178624, 'steps': 11346, 'loss/train': 1.8836588859558105} +11/06/2021 22:49:13 - INFO - __main__ - Step 11351: {'lr': 0.000495092238324015, 'samples': 2179392, 'steps': 11350, 'loss/train': 1.1730953454971313}} +11/06/2021 22:49:16 - INFO - __main__ - Step 11356: {'lr': 0.0004950870052421368, 'samples': 2180352, 'steps': 11355, 'loss/train': 1.806678295135498}} +11/06/2021 22:49:18 - INFO - __main__ - Step 11360: {'lr': 0.0004950828167888478, 'samples': 2181120, 'steps': 11359, 'loss/train': 1.9310498237609863} +11/06/2021 22:49:20 - INFO - __main__ - Step 11364: {'lr': 0.0004950786265686702, 'samples': 2181888, 'steps': 11363, 'loss/train': 1.6461005210876465} +11/06/2021 22:49:21 - INFO - __main__ - Step 11368: {'lr': 0.0004950744345816342, 'samples': 2182656, 'steps': 11367, 'loss/train': 1.2006498575210571} +11/06/2021 22:49:23 - INFO - __main__ - Step 11372: {'lr': 0.0004950702408277702, 'samples': 2183424, 'steps': 11371, 'loss/train': 1.4938647747039795} +11/06/2021 22:49:25 - INFO - __main__ - Step 11377: {'lr': 0.0004950649961508841, 'samples': 2184384, 'steps': 11376, 'loss/train': 2.194822311401367}} +11/06/2021 22:49:28 - INFO - __main__ - Step 11381: {'lr': 0.0004950607984217674, 'samples': 2185152, 'steps': 11380, 'loss/train': 1.64052414894104}}} +11/06/2021 22:49:30 - INFO - __main__ - Step 11385: {'lr': 0.0004950565989259207, 'samples': 2185920, 'steps': 11384, 'loss/train': 1.4204002618789673} +11/06/2021 22:49:31 - INFO - __main__ - Step 11389: {'lr': 0.0004950523976633745, 'samples': 2186688, 'steps': 11388, 'loss/train': 1.9979164600372314} +11/06/2021 22:49:33 - INFO - __main__ - Step 11393: {'lr': 0.000495048194634159, 'samples': 2187456, 'steps': 11392, 'loss/train': 1.676889419555664}4} +11/06/2021 22:49:36 - INFO - __main__ - Step 11398: {'lr': 0.0004950429383633073, 'samples': 2188416, 'steps': 11397, 'loss/train': 1.5339622497558594} +11/06/2021 22:49:38 - INFO - __main__ - Step 11403: {'lr': 0.0004950376793321413, 'samples': 2189376, 'steps': 11402, 'loss/train': 1.7271697521209717} +11/06/2021 22:49:40 - INFO - __main__ - Step 11407: {'lr': 0.0004950334701198222, 'samples': 2190144, 'steps': 11406, 'loss/train': 1.9516605138778687} +11/06/2021 22:49:40 - INFO - __main__ - Step 11407: {'lr': 0.0004950334701198222, 'samples': 2190144, 'steps': 11406, 'loss/train': 1.9516605138778687} +11/06/2021 22:49:43 - INFO - __main__ - Step 11414: {'lr': 0.0004950260997475623, 'samples': 2191488, 'steps': 11413, 'loss/train': 1.7055529356002808} +11/06/2021 22:49:46 - INFO - __main__ - Step 11419: {'lr': 0.0004950208318837892, 'samples': 2192448, 'steps': 11418, 'loss/train': 1.5548012256622314} +11/06/2021 22:49:48 - INFO - __main__ - Step 11424: {'lr': 0.0004950155612599511, 'samples': 2193408, 'steps': 11423, 'loss/train': 1.7228354215621948} +11/06/2021 22:49:48 - INFO - __main__ - Step 11424: {'lr': 0.0004950155612599511, 'samples': 2193408, 'steps': 11423, 'loss/train': 1.7228354215621948} +11/06/2021 22:49:51 - INFO - __main__ - Step 11430: {'lr': 0.0004950092328681428, 'samples': 2194560, 'steps': 11429, 'loss/train': 1.3537622690200806} +11/06/2021 22:49:54 - INFO - __main__ - Step 11435: {'lr': 0.0004950039561723703, 'samples': 2195520, 'steps': 11434, 'loss/train': 2.0817348957061768} +11/06/2021 22:49:56 - INFO - __main__ - Step 11440: {'lr': 0.0004949986767167228, 'samples': 2196480, 'steps': 11439, 'loss/train': 1.7402944564819336} +11/06/2021 22:49:58 - INFO - __main__ - Step 11444: {'lr': 0.0004949944511651347, 'samples': 2197248, 'steps': 11443, 'loss/train': 1.7834969758987427} +11/06/2021 22:49:58 - INFO - __main__ - Step 11444: {'lr': 0.0004949944511651347, 'samples': 2197248, 'steps': 11443, 'loss/train': 1.7834969758987427} +11/06/2021 22:50:02 - INFO - __main__ - Step 11451: {'lr': 0.0004949870521998312, 'samples': 2198592, 'steps': 11450, 'loss/train': 1.8337377309799194} +11/06/2021 22:50:04 - INFO - __main__ - Step 11456: {'lr': 0.0004949817639129832, 'samples': 2199552, 'steps': 11455, 'loss/train': 1.85826575756073}4} +11/06/2021 22:50:06 - INFO - __main__ - Step 11460: {'lr': 0.0004949775312965721, 'samples': 2200320, 'steps': 11459, 'loss/train': 1.5449903011322021} +11/06/2021 22:50:08 - INFO - __main__ - Step 11464: {'lr': 0.0004949732969140313, 'samples': 2201088, 'steps': 11463, 'loss/train': 1.5884931087493896} +11/06/2021 22:50:10 - INFO - __main__ - Step 11468: {'lr': 0.0004949690607653916, 'samples': 2201856, 'steps': 11467, 'loss/train': 1.5645625591278076} +11/06/2021 22:50:12 - INFO - __main__ - Step 11472: {'lr': 0.0004949648228506834, 'samples': 2202624, 'steps': 11471, 'loss/train': 1.6954563856124878} +11/06/2021 22:50:14 - INFO - __main__ - Step 11477: {'lr': 0.000494959522973811, 'samples': 2203584, 'steps': 11476, 'loss/train': 1.5947993993759155}} +11/06/2021 22:50:16 - INFO - __main__ - Step 11481: {'lr': 0.0004949552810855605, 'samples': 2204352, 'steps': 11480, 'loss/train': 1.7512733936309814} +11/06/2021 22:50:18 - INFO - __main__ - Step 11485: {'lr': 0.0004949510374313409, 'samples': 2205120, 'steps': 11484, 'loss/train': 1.3778972625732422} +11/06/2021 22:50:20 - INFO - __main__ - Step 11489: {'lr': 0.0004949467920111827, 'samples': 2205888, 'steps': 11488, 'loss/train': 2.2677342891693115} +11/06/2021 22:50:22 - INFO - __main__ - Step 11493: {'lr': 0.0004949425448251166, 'samples': 2206656, 'steps': 11492, 'loss/train': 1.598381757736206}} +11/06/2021 22:50:22 - INFO - __main__ - Step 11493: {'lr': 0.0004949425448251166, 'samples': 2206656, 'steps': 11492, 'loss/train': 1.598381757736206}} +11/06/2021 22:50:26 - INFO - __main__ - Step 11501: {'lr': 0.0004949340451553833, 'samples': 2208192, 'steps': 11500, 'loss/train': 1.7358423471450806} +11/06/2021 22:50:26 - INFO - __main__ - Step 11501: {'lr': 0.0004949340451553833, 'samples': 2208192, 'steps': 11500, 'loss/train': 1.7358423471450806} +11/06/2021 22:50:29 - INFO - __main__ - Step 11508: {'lr': 0.0004949266021502744, 'samples': 2209536, 'steps': 11507, 'loss/train': 1.2840288877487183} +11/06/2021 22:50:32 - INFO - __main__ - Step 11514: {'lr': 0.0004949202181275577, 'samples': 2210688, 'steps': 11513, 'loss/train': 1.9893686771392822} +11/06/2021 22:50:32 - INFO - __main__ - Step 11514: {'lr': 0.0004949202181275577, 'samples': 2210688, 'steps': 11513, 'loss/train': 1.9893686771392822} +11/06/2021 22:50:35 - INFO - __main__ - Step 11521: {'lr': 0.0004949127650798063, 'samples': 2212032, 'steps': 11520, 'loss/train': 1.619840145111084}} +11/06/2021 22:50:37 - INFO - __main__ - Step 11525: {'lr': 0.0004949085037675803, 'samples': 2212800, 'steps': 11524, 'loss/train': 1.7247838973999023} +11/06/2021 22:50:40 - INFO - __main__ - Step 11530: {'lr': 0.0004949031746443816, 'samples': 2213760, 'steps': 11529, 'loss/train': 1.8068318367004395} +11/06/2021 22:50:40 - INFO - __main__ - Step 11530: {'lr': 0.0004949031746443816, 'samples': 2213760, 'steps': 11529, 'loss/train': 1.8068318367004395} +11/06/2021 22:50:44 - INFO - __main__ - Step 11538: {'lr': 0.0004948946423091099, 'samples': 2215296, 'steps': 11537, 'loss/train': 1.8267381191253662} +11/06/2021 22:50:46 - INFO - __main__ - Step 11542: {'lr': 0.0004948903734931608, 'samples': 2216064, 'steps': 11541, 'loss/train': 1.5871480703353882} +11/06/2021 22:50:47 - INFO - __main__ - Step 11546: {'lr': 0.0004948861029117104, 'samples': 2216832, 'steps': 11545, 'loss/train': 1.524583339691162}} +11/06/2021 22:50:50 - INFO - __main__ - Step 11551: {'lr': 0.0004948807622022083, 'samples': 2217792, 'steps': 11550, 'loss/train': 2.3621954917907715} +11/06/2021 22:50:52 - INFO - __main__ - Step 11555: {'lr': 0.000494876487648493, 'samples': 2218560, 'steps': 11554, 'loss/train': 1.359278917312622}5} +11/06/2021 22:50:54 - INFO - __main__ - Step 11559: {'lr': 0.0004948722113293766, 'samples': 2219328, 'steps': 11558, 'loss/train': 1.786012053489685}} +11/06/2021 22:50:54 - INFO - __main__ - Step 11559: {'lr': 0.0004948722113293766, 'samples': 2219328, 'steps': 11558, 'loss/train': 1.786012053489685}} +11/06/2021 22:50:57 - INFO - __main__ - Step 11566: {'lr': 0.0004948647235230192, 'samples': 2220672, 'steps': 11565, 'loss/train': 1.6016157865524292} +11/06/2021 22:51:00 - INFO - __main__ - Step 11571: {'lr': 0.0004948593717799292, 'samples': 2221632, 'steps': 11570, 'loss/train': 1.6391667127609253} +11/06/2021 22:51:02 - INFO - __main__ - Step 11576: {'lr': 0.0004948540172785927, 'samples': 2222592, 'steps': 11575, 'loss/train': 1.5622731447219849} +11/06/2021 22:51:04 - INFO - __main__ - Step 11580: {'lr': 0.0004948497316916267, 'samples': 2223360, 'steps': 11579, 'loss/train': 2.0067150592803955} +11/06/2021 22:51:04 - INFO - __main__ - Step 11580: {'lr': 0.0004948497316916267, 'samples': 2223360, 'steps': 11579, 'loss/train': 2.0067150592803955} +11/06/2021 22:51:07 - INFO - __main__ - Step 11587: {'lr': 0.0004948422276669228, 'samples': 2224704, 'steps': 11586, 'loss/train': 1.91586434841156}5} +11/06/2021 22:51:10 - INFO - __main__ - Step 11592: {'lr': 0.0004948368643396035, 'samples': 2225664, 'steps': 11591, 'loss/train': 1.732541799545288}} +11/06/2021 22:51:12 - INFO - __main__ - Step 11597: {'lr': 0.0004948314982542914, 'samples': 2226624, 'steps': 11596, 'loss/train': 1.7309365272521973} +11/06/2021 22:51:12 - INFO - __main__ - Step 11597: {'lr': 0.0004948314982542914, 'samples': 2226624, 'steps': 11596, 'loss/train': 1.7309365272521973} +11/06/2021 22:51:15 - INFO - __main__ - Step 11604: {'lr': 0.0004948239811015416, 'samples': 2227968, 'steps': 11603, 'loss/train': 1.6033754348754883} +11/06/2021 22:51:18 - INFO - __main__ - Step 11609: {'lr': 0.0004948186083972934, 'samples': 2228928, 'steps': 11608, 'loss/train': 1.552068829536438}} +11/06/2021 22:51:20 - INFO - __main__ - Step 11613: {'lr': 0.0004948143082482852, 'samples': 2229696, 'steps': 11612, 'loss/train': 1.9601466655731201} +11/06/2021 22:51:22 - INFO - __main__ - Step 11618: {'lr': 0.0004948089305800638, 'samples': 2230656, 'steps': 11617, 'loss/train': 1.9734327793121338} +11/06/2021 22:51:22 - INFO - __main__ - Step 11618: {'lr': 0.0004948089305800638, 'samples': 2230656, 'steps': 11617, 'loss/train': 1.9734327793121338} +11/06/2021 22:51:26 - INFO - __main__ - Step 11625: {'lr': 0.000494801397211668, 'samples': 2232000, 'steps': 11624, 'loss/train': 1.5584590435028076}} +11/06/2021 22:51:28 - INFO - __main__ - Step 11629: {'lr': 0.0004947970900030346, 'samples': 2232768, 'steps': 11628, 'loss/train': 1.6569414138793945} +11/06/2021 22:51:30 - INFO - __main__ - Step 11634: {'lr': 0.0004947917035104564, 'samples': 2233728, 'steps': 11633, 'loss/train': 1.9105935096740723} +11/06/2021 22:51:30 - INFO - __main__ - Step 11634: {'lr': 0.0004947917035104564, 'samples': 2233728, 'steps': 11633, 'loss/train': 1.9105935096740723} +11/06/2021 22:51:34 - INFO - __main__ - Step 11642: {'lr': 0.0004947830793867896, 'samples': 2235264, 'steps': 11641, 'loss/train': 2.2054293155670166} +11/06/2021 22:51:36 - INFO - __main__ - Step 11646: {'lr': 0.0004947787646778491, 'samples': 2236032, 'steps': 11645, 'loss/train': 1.7138854265213013} +11/06/2021 22:51:38 - INFO - __main__ - Step 11650: {'lr': 0.0004947744482042122, 'samples': 2236800, 'steps': 11649, 'loss/train': 1.3429278135299683} +11/06/2021 22:51:40 - INFO - __main__ - Step 11655: {'lr': 0.0004947690501306088, 'samples': 2237760, 'steps': 11654, 'loss/train': 2.2113709449768066} +11/06/2021 22:51:42 - INFO - __main__ - Step 11660: {'lr': 0.0004947636492997765, 'samples': 2238720, 'steps': 11659, 'loss/train': 1.6339030265808105} +11/06/2021 22:51:42 - INFO - __main__ - Step 11660: {'lr': 0.0004947636492997765, 'samples': 2238720, 'steps': 11659, 'loss/train': 1.6339030265808105} +11/06/2021 22:51:46 - INFO - __main__ - Step 11667: {'lr': 0.0004947560835045826, 'samples': 2240064, 'steps': 11666, 'loss/train': 1.7168904542922974} +11/06/2021 22:51:48 - INFO - __main__ - Step 11671: {'lr': 0.0004947517577667996, 'samples': 2240832, 'steps': 11670, 'loss/train': 1.9244534969329834} +11/06/2021 22:51:50 - INFO - __main__ - Step 11676: {'lr': 0.0004947463481132438, 'samples': 2241792, 'steps': 11675, 'loss/train': 1.5373907089233398} +11/06/2021 22:51:50 - INFO - __main__ - Step 11676: {'lr': 0.0004947463481132438, 'samples': 2241792, 'steps': 11675, 'loss/train': 1.5373907089233398} +11/06/2021 22:51:54 - INFO - __main__ - Step 11684: {'lr': 0.0004947376869330755, 'samples': 2243328, 'steps': 11683, 'loss/train': 2.4655892848968506} +11/06/2021 22:51:56 - INFO - __main__ - Step 11688: {'lr': 0.0004947333536963753, 'samples': 2244096, 'steps': 11687, 'loss/train': 1.7653391361236572} +11/06/2021 22:51:58 - INFO - __main__ - Step 11692: {'lr': 0.0004947290186953057, 'samples': 2244864, 'steps': 11691, 'loss/train': 1.3742139339447021} +11/06/2021 22:52:00 - INFO - __main__ - Step 11697: {'lr': 0.0004947235974628723, 'samples': 2245824, 'steps': 11696, 'loss/train': 1.703428864479065}} +11/06/2021 22:52:02 - INFO - __main__ - Step 11701: {'lr': 0.0004947192584920866, 'samples': 2246592, 'steps': 11700, 'loss/train': 1.931963324546814}} +11/06/2021 22:52:05 - INFO - __main__ - Step 11705: {'lr': 0.0004947149177570332, 'samples': 2247360, 'steps': 11704, 'loss/train': 1.6442228555679321} +11/06/2021 22:52:06 - INFO - __main__ - Step 11709: {'lr': 0.0004947105752577436, 'samples': 2248128, 'steps': 11708, 'loss/train': 1.3050994873046875} +11/06/2021 22:52:08 - INFO - __main__ - Step 11713: {'lr': 0.000494706230994249, 'samples': 2248896, 'steps': 11712, 'loss/train': 1.7337501049041748}} +11/06/2021 22:52:11 - INFO - __main__ - Step 11717: {'lr': 0.0004947018849665809, 'samples': 2249664, 'steps': 11716, 'loss/train': 1.7236446142196655} +11/06/2021 22:52:13 - INFO - __main__ - Step 11721: {'lr': 0.0004946975371747704, 'samples': 2250432, 'steps': 11720, 'loss/train': 2.156588315963745}} +11/06/2021 22:52:14 - INFO - __main__ - Step 11725: {'lr': 0.000494693187618849, 'samples': 2251200, 'steps': 11724, 'loss/train': 1.6982334852218628}} +11/06/2021 22:52:16 - INFO - __main__ - Step 11729: {'lr': 0.000494688836298848, 'samples': 2251968, 'steps': 11728, 'loss/train': 1.9926396608352661}} +11/06/2021 22:52:18 - INFO - __main__ - Step 11734: {'lr': 0.0004946833946681575, 'samples': 2252928, 'steps': 11733, 'loss/train': 1.9588221311569214} +11/06/2021 22:52:18 - INFO - __main__ - Step 11734: {'lr': 0.0004946833946681575, 'samples': 2252928, 'steps': 11733, 'loss/train': 1.9588221311569214} +11/06/2021 22:52:23 - INFO - __main__ - Step 11742: {'lr': 0.0004946746823260491, 'samples': 2254464, 'steps': 11741, 'loss/train': 0.8344317078590393} +11/06/2021 22:52:24 - INFO - __main__ - Step 11746: {'lr': 0.00049467032350906, 'samples': 2255232, 'steps': 11745, 'loss/train': 1.7040636539459229}3} +11/06/2021 22:52:26 - INFO - __main__ - Step 11750: {'lr': 0.0004946659629281561, 'samples': 2256000, 'steps': 11749, 'loss/train': 1.6414493322372437} +11/06/2021 22:52:29 - INFO - __main__ - Step 11755: {'lr': 0.0004946605097215691, 'samples': 2256960, 'steps': 11754, 'loss/train': 1.4197173118591309} +11/06/2021 22:52:29 - INFO - __main__ - Step 11755: {'lr': 0.0004946605097215691, 'samples': 2256960, 'steps': 11754, 'loss/train': 1.4197173118591309} +11/06/2021 22:52:32 - INFO - __main__ - Step 11762: {'lr': 0.0004946528706022703, 'samples': 2258304, 'steps': 11761, 'loss/train': 2.078275442123413}} +11/06/2021 22:52:34 - INFO - __main__ - Step 11766: {'lr': 0.0004946485029660219, 'samples': 2259072, 'steps': 11765, 'loss/train': 1.9496246576309204} +11/06/2021 22:52:37 - INFO - __main__ - Step 11771: {'lr': 0.0004946430409404311, 'samples': 2260032, 'steps': 11770, 'loss/train': 1.5809372663497925} +11/06/2021 22:52:37 - INFO - __main__ - Step 11771: {'lr': 0.0004946430409404311, 'samples': 2260032, 'steps': 11770, 'loss/train': 1.5809372663497925} +11/06/2021 22:52:41 - INFO - __main__ - Step 11779: {'lr': 0.0004946342959674278, 'samples': 2261568, 'steps': 11778, 'loss/train': 1.6700574159622192} +11/06/2021 22:52:42 - INFO - __main__ - Step 11783: {'lr': 0.0004946299208354279, 'samples': 2262336, 'steps': 11782, 'loss/train': 1.7613064050674438} +11/06/2021 22:52:45 - INFO - __main__ - Step 11788: {'lr': 0.0004946244494403361, 'samples': 2263296, 'steps': 11787, 'loss/train': 1.7674616575241089} +11/06/2021 22:52:47 - INFO - __main__ - Step 11793: {'lr': 0.0004946189752896443, 'samples': 2264256, 'steps': 11792, 'loss/train': 1.361173152923584}} +11/06/2021 22:52:47 - INFO - __main__ - Step 11793: {'lr': 0.0004946189752896443, 'samples': 2264256, 'steps': 11792, 'loss/train': 1.361173152923584}} +11/06/2021 22:52:47 - INFO - __main__ - Step 11793: {'lr': 0.0004946189752896443, 'samples': 2264256, 'steps': 11792, 'loss/train': 1.361173152923584}} +11/06/2021 22:52:52 - INFO - __main__ - Step 11803: {'lr': 0.0004946080187217072, 'samples': 2266176, 'steps': 11802, 'loss/train': 1.8065892457962036} +11/06/2021 22:52:54 - INFO - __main__ - Step 11808: {'lr': 0.0004946025363045854, 'samples': 2267136, 'steps': 11807, 'loss/train': 1.8952033519744873} +11/06/2021 22:52:54 - INFO - __main__ - Step 11808: {'lr': 0.0004946025363045854, 'samples': 2267136, 'steps': 11807, 'loss/train': 1.8952033519744873} +11/06/2021 22:52:54 - INFO - __main__ - Step 11808: {'lr': 0.0004946025363045854, 'samples': 2267136, 'steps': 11807, 'loss/train': 1.8952033519744873} +11/06/2021 22:53:00 - INFO - __main__ - Step 11819: {'lr': 0.0004945904652881611, 'samples': 2269248, 'steps': 11818, 'loss/train': 1.905003547668457}} +11/06/2021 22:53:00 - INFO - __main__ - Step 11819: {'lr': 0.0004945904652881611, 'samples': 2269248, 'steps': 11818, 'loss/train': 1.905003547668457}} +11/06/2021 22:53:04 - INFO - __main__ - Step 11827: {'lr': 0.0004945816779912272, 'samples': 2270784, 'steps': 11826, 'loss/train': 1.1215801239013672} +11/06/2021 22:53:06 - INFO - __main__ - Step 11831: {'lr': 0.0004945772816978309, 'samples': 2271552, 'steps': 11830, 'loss/train': 1.8250958919525146} +11/06/2021 22:53:08 - INFO - __main__ - Step 11836: {'lr': 0.0004945717838515275, 'samples': 2272512, 'steps': 11835, 'loss/train': 1.7910774946212769} +11/06/2021 22:53:11 - INFO - __main__ - Step 11841: {'lr': 0.0004945662832502171, 'samples': 2273472, 'steps': 11840, 'loss/train': 1.478073000907898}} +11/06/2021 22:53:13 - INFO - __main__ - Step 11845: {'lr': 0.0004945618807856056, 'samples': 2274240, 'steps': 11844, 'loss/train': 1.2191367149353027} +11/06/2021 22:53:15 - INFO - __main__ - Step 11849: {'lr': 0.0004945574765578612, 'samples': 2275008, 'steps': 11848, 'loss/train': 1.4972808361053467} +11/06/2021 22:53:16 - INFO - __main__ - Step 11853: {'lr': 0.0004945530705670156, 'samples': 2275776, 'steps': 11852, 'loss/train': 1.7779545783996582} +11/06/2021 22:53:19 - INFO - __main__ - Step 11857: {'lr': 0.0004945486628131006, 'samples': 2276544, 'steps': 11856, 'loss/train': 1.342666506767273}} +11/06/2021 22:53:21 - INFO - __main__ - Step 11862: {'lr': 0.0004945431506414386, 'samples': 2277504, 'steps': 11861, 'loss/train': 2.1039764881134033} +11/06/2021 22:53:21 - INFO - __main__ - Step 11862: {'lr': 0.0004945431506414386, 'samples': 2277504, 'steps': 11861, 'loss/train': 2.1039764881134033} +11/06/2021 22:53:24 - INFO - __main__ - Step 11869: {'lr': 0.0004945354289732565, 'samples': 2278848, 'steps': 11868, 'loss/train': 1.6801567077636719} +11/06/2021 22:53:26 - INFO - __main__ - Step 11873: {'lr': 0.0004945310141673816, 'samples': 2279616, 'steps': 11872, 'loss/train': 1.7067826986312866} +11/06/2021 22:53:29 - INFO - __main__ - Step 11878: {'lr': 0.0004945254931809489, 'samples': 2280576, 'steps': 11877, 'loss/train': 1.5857558250427246} +11/06/2021 22:53:31 - INFO - __main__ - Step 11882: {'lr': 0.0004945210744085702, 'samples': 2281344, 'steps': 11881, 'loss/train': 2.2412431240081787} +11/06/2021 22:53:31 - INFO - __main__ - Step 11882: {'lr': 0.0004945210744085702, 'samples': 2281344, 'steps': 11881, 'loss/train': 2.2412431240081787} +11/06/2021 22:53:34 - INFO - __main__ - Step 11889: {'lr': 0.000494513337315096, 'samples': 2282688, 'steps': 11888, 'loss/train': 1.7061456441879272}} +11/06/2021 22:53:37 - INFO - __main__ - Step 11894: {'lr': 0.0004945078075145292, 'samples': 2283648, 'steps': 11893, 'loss/train': 2.0001227855682373} +11/06/2021 22:53:39 - INFO - __main__ - Step 11899: {'lr': 0.0004945022749596764, 'samples': 2284608, 'steps': 11898, 'loss/train': 1.6990892887115479} +11/06/2021 22:53:41 - INFO - __main__ - Step 11903: {'lr': 0.0004944978469327499, 'samples': 2285376, 'steps': 11902, 'loss/train': 1.8978601694107056} +11/06/2021 22:53:43 - INFO - __main__ - Step 11907: {'lr': 0.0004944934171431522, 'samples': 2286144, 'steps': 11906, 'loss/train': 1.794429898262024}} +11/06/2021 22:53:43 - INFO - __main__ - Step 11907: {'lr': 0.0004944934171431522, 'samples': 2286144, 'steps': 11906, 'loss/train': 1.794429898262024}} +11/06/2021 22:53:46 - INFO - __main__ - Step 11914: {'lr': 0.0004944856607700243, 'samples': 2287488, 'steps': 11913, 'loss/train': 1.3514317274093628} +11/06/2021 22:53:49 - INFO - __main__ - Step 11920: {'lr': 0.0004944790081538969, 'samples': 2288640, 'steps': 11919, 'loss/train': 1.7780016660690308} +11/06/2021 22:53:51 - INFO - __main__ - Step 11924: {'lr': 0.0004944745708733025, 'samples': 2289408, 'steps': 11923, 'loss/train': 2.0285587310791016} +11/06/2021 22:53:53 - INFO - __main__ - Step 11928: {'lr': 0.0004944701318302046, 'samples': 2290176, 'steps': 11927, 'loss/train': 1.5972325801849365} +11/06/2021 22:53:55 - INFO - __main__ - Step 11932: {'lr': 0.0004944656910246352, 'samples': 2290944, 'steps': 11931, 'loss/train': 1.651598572731018}} +11/06/2021 22:53:57 - INFO - __main__ - Step 11936: {'lr': 0.0004944612484566263, 'samples': 2291712, 'steps': 11935, 'loss/train': 1.43559730052948}}} +11/06/2021 22:53:59 - INFO - __main__ - Step 11941: {'lr': 0.0004944556927682335, 'samples': 2292672, 'steps': 11940, 'loss/train': 1.7804417610168457} +11/06/2021 22:54:01 - INFO - __main__ - Step 11945: {'lr': 0.0004944512462348528, 'samples': 2293440, 'steps': 11944, 'loss/train': 1.9006822109222412} +11/06/2021 22:54:01 - INFO - __main__ - Step 11945: {'lr': 0.0004944512462348528, 'samples': 2293440, 'steps': 11944, 'loss/train': 1.9006822109222412} +11/06/2021 22:54:04 - INFO - __main__ - Step 11952: {'lr': 0.0004944434605608367, 'samples': 2294784, 'steps': 11951, 'loss/train': 1.2838270664215088} +11/06/2021 22:54:06 - INFO - __main__ - Step 11956: {'lr': 0.0004944390091811111, 'samples': 2295552, 'steps': 11955, 'loss/train': 1.7346197366714478} +11/06/2021 22:54:09 - INFO - __main__ - Step 11962: {'lr': 0.0004944323288073192, 'samples': 2296704, 'steps': 11961, 'loss/train': 1.4151784181594849} +11/06/2021 22:54:11 - INFO - __main__ - Step 11966: {'lr': 0.0004944278730220359, 'samples': 2297472, 'steps': 11965, 'loss/train': 1.4997888803482056} +11/06/2021 22:54:11 - INFO - __main__ - Step 11966: {'lr': 0.0004944278730220359, 'samples': 2297472, 'steps': 11965, 'loss/train': 1.4997888803482056} +11/06/2021 22:54:15 - INFO - __main__ - Step 11973: {'lr': 0.0004944200711575956, 'samples': 2298816, 'steps': 11972, 'loss/train': 1.9672355651855469} +11/06/2021 22:54:17 - INFO - __main__ - Step 11977: {'lr': 0.0004944156105264308, 'samples': 2299584, 'steps': 11976, 'loss/train': 0.3471572995185852} +11/06/2021 22:54:19 - INFO - __main__ - Step 11982: {'lr': 0.0004944100322595558, 'samples': 2300544, 'steps': 11981, 'loss/train': 1.5777186155319214} +11/06/2021 22:54:21 - INFO - __main__ - Step 11986: {'lr': 0.0004944055676637599, 'samples': 2301312, 'steps': 11985, 'loss/train': 1.4917117357254028} +11/06/2021 22:54:21 - INFO - __main__ - Step 11986: {'lr': 0.0004944055676637599, 'samples': 2301312, 'steps': 11985, 'loss/train': 1.4917117357254028} +11/06/2021 22:54:25 - INFO - __main__ - Step 11993: {'lr': 0.0004943977503813092, 'samples': 2302656, 'steps': 11992, 'loss/train': 1.3840059041976929} +11/06/2021 22:54:27 - INFO - __main__ - Step 11998: {'lr': 0.0004943921633044644, 'samples': 2303616, 'steps': 11997, 'loss/train': 1.752882480621338}} +11/06/2021 22:54:29 - INFO - __main__ - Step 12003: {'lr': 0.0004943865734746364, 'samples': 2304576, 'steps': 12002, 'loss/train': 1.8876904249191284} +11/06/2021 22:54:29 - INFO - __main__ - Step 12003: {'lr': 0.0004943865734746364, 'samples': 2304576, 'steps': 12002, 'loss/train': 1.8876904249191284} +11/06/2021 22:54:33 - INFO - __main__ - Step 12010: {'lr': 0.0004943787430879846, 'samples': 2305920, 'steps': 12009, 'loss/train': 1.99528169631958}4} +11/06/2021 22:54:35 - INFO - __main__ - Step 12014: {'lr': 0.000494374266158823, 'samples': 2306688, 'steps': 12013, 'loss/train': 1.9051744937896729}} +11/06/2021 22:54:37 - INFO - __main__ - Step 12018: {'lr': 0.000494369787467881, 'samples': 2307456, 'steps': 12017, 'loss/train': 1.328963041305542}}} +11/06/2021 22:54:37 - INFO - __main__ - Step 12018: {'lr': 0.000494369787467881, 'samples': 2307456, 'steps': 12017, 'loss/train': 1.328963041305542}}} +11/06/2021 22:54:37 - INFO - __main__ - Step 12018: {'lr': 0.000494369787467881, 'samples': 2307456, 'steps': 12017, 'loss/train': 1.328963041305542}}} +11/06/2021 22:54:42 - INFO - __main__ - Step 12029: {'lr': 0.0004943574619838741, 'samples': 2309568, 'steps': 12028, 'loss/train': 1.7877787351608276} +11/06/2021 22:54:45 - INFO - __main__ - Step 12034: {'lr': 0.0004943518550869552, 'samples': 2310528, 'steps': 12033, 'loss/train': 1.0278202295303345} +11/06/2021 22:54:47 - INFO - __main__ - Step 12039: {'lr': 0.0004943462454375069, 'samples': 2311488, 'steps': 12038, 'loss/train': 1.6484863758087158} +11/06/2021 22:54:50 - INFO - __main__ - Step 12044: {'lr': 0.0004943406330355925, 'samples': 2312448, 'steps': 12043, 'loss/train': 1.159117341041565}} +11/06/2021 22:54:50 - INFO - __main__ - Step 12044: {'lr': 0.0004943406330355925, 'samples': 2312448, 'steps': 12043, 'loss/train': 1.159117341041565}} +11/06/2021 22:54:50 - INFO - __main__ - Step 12044: {'lr': 0.0004943406330355925, 'samples': 2312448, 'steps': 12043, 'loss/train': 1.159117341041565}} +11/06/2021 22:54:54 - INFO - __main__ - Step 12054: {'lr': 0.0004943293999746179, 'samples': 2314368, 'steps': 12053, 'loss/train': 1.585003137588501}} +11/06/2021 22:54:57 - INFO - __main__ - Step 12059: {'lr': 0.0004943237793156844, 'samples': 2315328, 'steps': 12058, 'loss/train': 2.4570651054382324} +11/06/2021 22:54:59 - INFO - __main__ - Step 12063: {'lr': 0.0004943192808069411, 'samples': 2316096, 'steps': 12062, 'loss/train': 1.2292014360427856} +11/06/2021 22:54:59 - INFO - __main__ - Step 12063: {'lr': 0.0004943192808069411, 'samples': 2316096, 'steps': 12062, 'loss/train': 1.2292014360427856} +11/06/2021 22:55:03 - INFO - __main__ - Step 12070: {'lr': 0.0004943114041783296, 'samples': 2317440, 'steps': 12069, 'loss/train': 1.788710355758667}} +11/06/2021 22:55:05 - INFO - __main__ - Step 12075: {'lr': 0.0004943057747125371, 'samples': 2318400, 'steps': 12074, 'loss/train': 1.8841195106506348} +11/06/2021 22:55:07 - INFO - __main__ - Step 12079: {'lr': 0.0004943012691584526, 'samples': 2319168, 'steps': 12078, 'loss/train': 1.6468000411987305} +11/06/2021 22:55:07 - INFO - __main__ - Step 12079: {'lr': 0.0004943012691584526, 'samples': 2319168, 'steps': 12078, 'loss/train': 1.6468000411987305} +11/06/2021 22:55:11 - INFO - __main__ - Step 12086: {'lr': 0.0004942933802008066, 'samples': 2320512, 'steps': 12085, 'loss/train': 2.0663843154907227} +11/06/2021 22:55:13 - INFO - __main__ - Step 12090: {'lr': 0.0004942888698033515, 'samples': 2321280, 'steps': 12089, 'loss/train': 1.889116883277893}} +11/06/2021 22:55:15 - INFO - __main__ - Step 12094: {'lr': 0.0004942843576447316, 'samples': 2322048, 'steps': 12093, 'loss/train': 1.6451750993728638} +11/06/2021 22:55:17 - INFO - __main__ - Step 12099: {'lr': 0.0004942787149698687, 'samples': 2323008, 'steps': 12098, 'loss/train': 1.9871211051940918} +11/06/2021 22:55:17 - INFO - __main__ - Step 12099: {'lr': 0.0004942787149698687, 'samples': 2323008, 'steps': 12098, 'loss/train': 1.9871211051940918} +11/06/2021 22:55:21 - INFO - __main__ - Step 12107: {'lr': 0.0004942696809665668, 'samples': 2324544, 'steps': 12106, 'loss/train': 1.9903008937835693} +11/06/2021 22:55:23 - INFO - __main__ - Step 12111: {'lr': 0.0004942651613233599, 'samples': 2325312, 'steps': 12110, 'loss/train': 1.8227951526641846} +11/06/2021 22:55:25 - INFO - __main__ - Step 12115: {'lr': 0.0004942606399191593, 'samples': 2326080, 'steps': 12114, 'loss/train': 1.4733009338378906} +11/06/2021 22:55:25 - INFO - __main__ - Step 12115: {'lr': 0.0004942606399191593, 'samples': 2326080, 'steps': 12114, 'loss/train': 1.4733009338378906} +11/06/2021 22:55:25 - INFO - __main__ - Step 12115: {'lr': 0.0004942606399191593, 'samples': 2326080, 'steps': 12114, 'loss/train': 1.4733009338378906} +11/06/2021 22:55:31 - INFO - __main__ - Step 12126: {'lr': 0.0004942481969777495, 'samples': 2328192, 'steps': 12125, 'loss/train': 2.258380889892578}} +11/06/2021 22:55:33 - INFO - __main__ - Step 12131: {'lr': 0.000494242536693071, 'samples': 2329152, 'steps': 12130, 'loss/train': 1.718927264213562}}} +11/06/2021 22:55:35 - INFO - __main__ - Step 12135: {'lr': 0.0004942380064843906, 'samples': 2329920, 'steps': 12134, 'loss/train': 1.8256616592407227} +11/06/2021 22:55:38 - INFO - __main__ - Step 12139: {'lr': 0.0004942334745149122, 'samples': 2330688, 'steps': 12138, 'loss/train': 2.0332870483398438} +11/06/2021 22:55:40 - INFO - __main__ - Step 12143: {'lr': 0.0004942289407846684, 'samples': 2331456, 'steps': 12142, 'loss/train': 0.5399057865142822} +11/06/2021 22:55:41 - INFO - __main__ - Step 12147: {'lr': 0.000494224405293692, 'samples': 2332224, 'steps': 12146, 'loss/train': 1.870377779006958}2} +11/06/2021 22:55:43 - INFO - __main__ - Step 12152: {'lr': 0.0004942187334539908, 'samples': 2333184, 'steps': 12151, 'loss/train': 1.949316382408142}} +11/06/2021 22:55:45 - INFO - __main__ - Step 12156: {'lr': 0.0004942141940014854, 'samples': 2333952, 'steps': 12155, 'loss/train': 1.7409350872039795} +11/06/2021 22:55:47 - INFO - __main__ - Step 12160: {'lr': 0.0004942096527883538, 'samples': 2334720, 'steps': 12159, 'loss/train': 1.4643501043319702} +11/06/2021 22:55:50 - INFO - __main__ - Step 12164: {'lr': 0.0004942051098146284, 'samples': 2335488, 'steps': 12163, 'loss/train': 1.9286428689956665} +11/06/2021 22:55:51 - INFO - __main__ - Step 12168: {'lr': 0.0004942005650803421, 'samples': 2336256, 'steps': 12167, 'loss/train': 1.5838422775268555} +11/06/2021 22:55:53 - INFO - __main__ - Step 12173: {'lr': 0.0004941948816867455, 'samples': 2337216, 'steps': 12172, 'loss/train': 1.5987201929092407} +11/06/2021 22:55:56 - INFO - __main__ - Step 12178: {'lr': 0.0004941891955423878, 'samples': 2338176, 'steps': 12177, 'loss/train': 2.281742811203003}} +11/06/2021 22:55:56 - INFO - __main__ - Step 12178: {'lr': 0.0004941891955423878, 'samples': 2338176, 'steps': 12177, 'loss/train': 2.281742811203003}} +11/06/2021 22:56:00 - INFO - __main__ - Step 12185: {'lr': 0.0004941812303191302, 'samples': 2339520, 'steps': 12184, 'loss/train': 1.8058403730392456} +11/06/2021 22:56:01 - INFO - __main__ - Step 12189: {'lr': 0.0004941766763424373, 'samples': 2340288, 'steps': 12188, 'loss/train': 1.433286190032959}} +11/06/2021 22:56:03 - INFO - __main__ - Step 12193: {'lr': 0.0004941721206053885, 'samples': 2341056, 'steps': 12192, 'loss/train': 3.6256818771362305} +11/06/2021 22:56:06 - INFO - __main__ - Step 12198: {'lr': 0.000494166423458627, 'samples': 2342016, 'steps': 12197, 'loss/train': 2.043381929397583}5} +11/06/2021 22:56:06 - INFO - __main__ - Step 12198: {'lr': 0.000494166423458627, 'samples': 2342016, 'steps': 12197, 'loss/train': 2.043381929397583}5} +11/06/2021 22:56:10 - INFO - __main__ - Step 12206: {'lr': 0.000494157302302919, 'samples': 2343552, 'steps': 12205, 'loss/train': 1.4476592540740967}} +11/06/2021 22:56:11 - INFO - __main__ - Step 12210: {'lr': 0.0004941527390847243, 'samples': 2344320, 'steps': 12209, 'loss/train': 1.1334985494613647} +11/06/2021 22:56:11 - INFO - __main__ - Step 12210: {'lr': 0.0004941527390847243, 'samples': 2344320, 'steps': 12209, 'loss/train': 1.1334985494613647} +11/06/2021 22:56:15 - INFO - __main__ - Step 12218: {'lr': 0.0004941436073678179, 'samples': 2345856, 'steps': 12217, 'loss/train': 1.678484320640564}} +11/06/2021 22:56:17 - INFO - __main__ - Step 12222: {'lr': 0.0004941390388691719, 'samples': 2346624, 'steps': 12221, 'loss/train': 1.6822108030319214} +11/06/2021 22:56:19 - INFO - __main__ - Step 12226: {'lr': 0.0004941344686104414, 'samples': 2347392, 'steps': 12225, 'loss/train': 1.5134607553482056} +11/06/2021 22:56:21 - INFO - __main__ - Step 12231: {'lr': 0.0004941287533119597, 'samples': 2348352, 'steps': 12230, 'loss/train': 1.1296072006225586} +11/06/2021 22:56:21 - INFO - __main__ - Step 12231: {'lr': 0.0004941287533119597, 'samples': 2348352, 'steps': 12230, 'loss/train': 1.1296072006225586} +11/06/2021 22:56:25 - INFO - __main__ - Step 12238: {'lr': 0.0004941207472740724, 'samples': 2349696, 'steps': 12237, 'loss/train': 1.9084161520004272} +11/06/2021 22:56:27 - INFO - __main__ - Step 12242: {'lr': 0.0004941161699753335, 'samples': 2350464, 'steps': 12241, 'loss/train': 2.5496790409088135} +11/06/2021 22:56:30 - INFO - __main__ - Step 12248: {'lr': 0.0004941093007273859, 'samples': 2351616, 'steps': 12247, 'loss/train': 2.001997470855713}} +11/06/2021 22:56:30 - INFO - __main__ - Step 12248: {'lr': 0.0004941093007273859, 'samples': 2351616, 'steps': 12247, 'loss/train': 2.001997470855713}} +11/06/2021 22:56:34 - INFO - __main__ - Step 12255: {'lr': 0.0004941012816001575, 'samples': 2352960, 'steps': 12254, 'loss/train': 1.6902923583984375} +11/06/2021 22:56:35 - INFO - __main__ - Step 12259: {'lr': 0.0004940966968219881, 'samples': 2353728, 'steps': 12258, 'loss/train': 1.807405948638916}} +11/06/2021 22:56:37 - INFO - __main__ - Step 12264: {'lr': 0.0004940909633745905, 'samples': 2354688, 'steps': 12263, 'loss/train': 1.749647617340088}} +11/06/2021 22:56:37 - INFO - __main__ - Step 12264: {'lr': 0.0004940909633745905, 'samples': 2354688, 'steps': 12263, 'loss/train': 1.749647617340088}} +11/06/2021 22:56:41 - INFO - __main__ - Step 12271: {'lr': 0.0004940829319289361, 'samples': 2356032, 'steps': 12270, 'loss/train': 1.8408467769622803} +11/06/2021 22:56:43 - INFO - __main__ - Step 12275: {'lr': 0.000494078340111848, 'samples': 2356800, 'steps': 12274, 'loss/train': 1.8969393968582153}} +11/06/2021 22:56:45 - INFO - __main__ - Step 12280: {'lr': 0.0004940725978659881, 'samples': 2357760, 'steps': 12279, 'loss/train': 1.9200348854064941} +11/06/2021 22:56:48 - INFO - __main__ - Step 12285: {'lr': 0.0004940668528707446, 'samples': 2358720, 'steps': 12284, 'loss/train': 1.4615005254745483} +11/06/2021 22:56:48 - INFO - __main__ - Step 12285: {'lr': 0.0004940668528707446, 'samples': 2358720, 'steps': 12284, 'loss/train': 1.4615005254745483} +11/06/2021 22:56:51 - INFO - __main__ - Step 12292: {'lr': 0.0004940588052585624, 'samples': 2360064, 'steps': 12291, 'loss/train': 1.7617274522781372} +11/06/2021 22:56:53 - INFO - __main__ - Step 12296: {'lr': 0.0004940542042036974, 'samples': 2360832, 'steps': 12295, 'loss/train': 1.7313815355300903} +11/06/2021 22:56:55 - INFO - __main__ - Step 12301: {'lr': 0.0004940484504108612, 'samples': 2361792, 'steps': 12300, 'loss/train': 1.4371073246002197} +11/06/2021 22:56:55 - INFO - __main__ - Step 12301: {'lr': 0.0004940484504108612, 'samples': 2361792, 'steps': 12300, 'loss/train': 1.4371073246002197} +11/06/2021 22:57:00 - INFO - __main__ - Step 12309: {'lr': 0.0004940392386241981, 'samples': 2363328, 'steps': 12308, 'loss/train': 2.2593603134155273} +11/06/2021 22:57:01 - INFO - __main__ - Step 12313: {'lr': 0.0004940346300918024, 'samples': 2364096, 'steps': 12312, 'loss/train': 1.6373891830444336} +11/06/2021 22:57:03 - INFO - __main__ - Step 12317: {'lr': 0.0004940300198000748, 'samples': 2364864, 'steps': 12316, 'loss/train': 1.8684685230255127} +11/06/2021 22:57:06 - INFO - __main__ - Step 12322: {'lr': 0.0004940242544614056, 'samples': 2365824, 'steps': 12321, 'loss/train': 1.541722297668457}} +11/06/2021 22:57:08 - INFO - __main__ - Step 12326: {'lr': 0.0004940196402113031, 'samples': 2366592, 'steps': 12325, 'loss/train': 1.683254361152649}} +11/06/2021 22:57:08 - INFO - __main__ - Step 12326: {'lr': 0.0004940196402113031, 'samples': 2366592, 'steps': 12325, 'loss/train': 1.683254361152649}} +11/06/2021 22:57:11 - INFO - __main__ - Step 12333: {'lr': 0.0004940115610405114, 'samples': 2367936, 'steps': 12332, 'loss/train': 1.9940561056137085} +11/06/2021 22:57:14 - INFO - __main__ - Step 12339: {'lr': 0.000494004631749003, 'samples': 2369088, 'steps': 12338, 'loss/train': 1.7027802467346191}} +11/06/2021 22:57:16 - INFO - __main__ - Step 12343: {'lr': 0.0004940000100224295, 'samples': 2369856, 'steps': 12342, 'loss/train': 1.2512726783752441} +11/06/2021 22:57:18 - INFO - __main__ - Step 12347: {'lr': 0.0004939953865367735, 'samples': 2370624, 'steps': 12346, 'loss/train': 1.1613168716430664} +11/06/2021 22:57:18 - INFO - __main__ - Step 12347: {'lr': 0.0004939953865367735, 'samples': 2370624, 'steps': 12346, 'loss/train': 1.1613168716430664} +11/06/2021 22:57:21 - INFO - __main__ - Step 12354: {'lr': 0.0004939872912041844, 'samples': 2371968, 'steps': 12353, 'loss/train': 1.7622441053390503} +11/06/2021 22:57:24 - INFO - __main__ - Step 12360: {'lr': 0.0004939803480601333, 'samples': 2373120, 'steps': 12359, 'loss/train': 1.4958027601242065} +11/06/2021 22:57:24 - INFO - __main__ - Step 12360: {'lr': 0.0004939803480601333, 'samples': 2373120, 'steps': 12359, 'loss/train': 1.4958027601242065} +11/06/2021 22:57:27 - INFO - __main__ - Step 12366: {'lr': 0.0004939734009584661, 'samples': 2374272, 'steps': 12365, 'loss/train': 2.075040578842163}} +11/06/2021 22:57:29 - INFO - __main__ - Step 12370: {'lr': 0.0004939687673587346, 'samples': 2375040, 'steps': 12369, 'loss/train': 1.79799222946167}}} +11/06/2021 22:57:31 - INFO - __main__ - Step 12375: {'lr': 0.0004939629728856817, 'samples': 2376000, 'steps': 12374, 'loss/train': 1.2412973642349243} +11/06/2021 22:57:34 - INFO - __main__ - Step 12380: {'lr': 0.0004939571756644799, 'samples': 2376960, 'steps': 12379, 'loss/train': 1.6386349201202393} +11/06/2021 22:57:34 - INFO - __main__ - Step 12380: {'lr': 0.0004939571756644799, 'samples': 2376960, 'steps': 12379, 'loss/train': 1.6386349201202393} +11/06/2021 22:57:37 - INFO - __main__ - Step 12386: {'lr': 0.0004939502153715733, 'samples': 2378112, 'steps': 12385, 'loss/train': 1.881219744682312}} +11/06/2021 22:57:40 - INFO - __main__ - Step 12391: {'lr': 0.0004939444121046741, 'samples': 2379072, 'steps': 12390, 'loss/train': 1.171319603919983}} +11/06/2021 22:57:42 - INFO - __main__ - Step 12395: {'lr': 0.000493939767512635, 'samples': 2379840, 'steps': 12394, 'loss/train': 1.767325758934021}}} +11/06/2021 22:57:42 - INFO - __main__ - Step 12395: {'lr': 0.000493939767512635, 'samples': 2379840, 'steps': 12394, 'loss/train': 1.767325758934021}}} +11/06/2021 22:57:45 - INFO - __main__ - Step 12402: {'lr': 0.0004939316352448403, 'samples': 2381184, 'steps': 12401, 'loss/train': 1.0791970491409302} +11/06/2021 22:57:48 - INFO - __main__ - Step 12408: {'lr': 0.0004939246604430195, 'samples': 2382336, 'steps': 12407, 'loss/train': 1.8069547414779663} +11/06/2021 22:57:50 - INFO - __main__ - Step 12413: {'lr': 0.000493918845085675, 'samples': 2383296, 'steps': 12412, 'loss/train': 1.7577980756759644}} +11/06/2021 22:57:50 - INFO - __main__ - Step 12413: {'lr': 0.000493918845085675, 'samples': 2383296, 'steps': 12412, 'loss/train': 1.7577980756759644}} +11/06/2021 22:57:53 - INFO - __main__ - Step 12419: {'lr': 0.0004939118630299672, 'samples': 2384448, 'steps': 12418, 'loss/train': 1.799317479133606}} +11/06/2021 22:57:55 - INFO - __main__ - Step 12423: {'lr': 0.0004939072061280967, 'samples': 2385216, 'steps': 12422, 'loss/train': 1.4663667678833008} +11/06/2021 22:57:58 - INFO - __main__ - Step 12428: {'lr': 0.0004939013825279939, 'samples': 2386176, 'steps': 12427, 'loss/train': 1.5649765729904175} +11/06/2021 22:58:00 - INFO - __main__ - Step 12433: {'lr': 0.0004938955561804361, 'samples': 2387136, 'steps': 12432, 'loss/train': 1.6927978992462158} +11/06/2021 22:58:00 - INFO - __main__ - Step 12433: {'lr': 0.0004938955561804361, 'samples': 2387136, 'steps': 12432, 'loss/train': 1.6927978992462158} +11/06/2021 22:58:03 - INFO - __main__ - Step 12440: {'lr': 0.0004938873946782557, 'samples': 2388480, 'steps': 12439, 'loss/train': 1.3930256366729736} +11/06/2021 22:58:05 - INFO - __main__ - Step 12444: {'lr': 0.0004938827285450908, 'samples': 2389248, 'steps': 12443, 'loss/train': 1.6230531930923462} +11/06/2021 22:58:08 - INFO - __main__ - Step 12449: {'lr': 0.0004938768934061182, 'samples': 2390208, 'steps': 12448, 'loss/train': 1.9037350416183472} +11/06/2021 22:58:10 - INFO - __main__ - Step 12453: {'lr': 0.000493872223316968, 'samples': 2390976, 'steps': 12452, 'loss/train': 1.4199427366256714}} +11/06/2021 22:58:10 - INFO - __main__ - Step 12453: {'lr': 0.000493872223316968, 'samples': 2390976, 'steps': 12452, 'loss/train': 1.4199427366256714}} +11/06/2021 22:58:13 - INFO - __main__ - Step 12460: {'lr': 0.0004938640464304006, 'samples': 2392320, 'steps': 12459, 'loss/train': 1.7510279417037964} +11/06/2021 22:58:15 - INFO - __main__ - Step 12464: {'lr': 0.0004938593715063888, 'samples': 2393088, 'steps': 12463, 'loss/train': 1.430334448814392}} +11/06/2021 22:58:18 - INFO - __main__ - Step 12469: {'lr': 0.0004938535253790944, 'samples': 2394048, 'steps': 12468, 'loss/train': 1.569968342781067}} +11/06/2021 22:58:20 - INFO - __main__ - Step 12473: {'lr': 0.0004938488464994764, 'samples': 2394816, 'steps': 12472, 'loss/train': 1.2448487281799316} +11/06/2021 22:58:22 - INFO - __main__ - Step 12477: {'lr': 0.0004938441658618659, 'samples': 2395584, 'steps': 12476, 'loss/train': 1.6196297407150269} +11/06/2021 22:58:23 - INFO - __main__ - Step 12481: {'lr': 0.0004938394834662966, 'samples': 2396352, 'steps': 12480, 'loss/train': 0.9850826859474182} +11/06/2021 22:58:25 - INFO - __main__ - Step 12485: {'lr': 0.0004938347993128025, 'samples': 2397120, 'steps': 12484, 'loss/train': 1.588280439376831}} +11/06/2021 22:58:28 - INFO - __main__ - Step 12490: {'lr': 0.0004938289416489042, 'samples': 2398080, 'steps': 12489, 'loss/train': 2.0924293994903564} +11/06/2021 22:58:30 - INFO - __main__ - Step 12494: {'lr': 0.0004938242535402025, 'samples': 2398848, 'steps': 12493, 'loss/train': 1.4478893280029297} +11/06/2021 22:58:30 - INFO - __main__ - Step 12494: {'lr': 0.0004938242535402025, 'samples': 2398848, 'steps': 12493, 'loss/train': 1.4478893280029297} +11/06/2021 22:58:34 - INFO - __main__ - Step 12501: {'lr': 0.000493816045120252, 'samples': 2400192, 'steps': 12500, 'loss/train': 1.6998056173324585}} +11/06/2021 22:58:36 - INFO - __main__ - Step 12506: {'lr': 0.0004938101786673416, 'samples': 2401152, 'steps': 12505, 'loss/train': 1.861094355583191}} +11/06/2021 22:58:38 - INFO - __main__ - Step 12511: {'lr': 0.0004938043094680036, 'samples': 2402112, 'steps': 12510, 'loss/train': 1.6733269691467285} +11/06/2021 22:58:38 - INFO - __main__ - Step 12511: {'lr': 0.0004938043094680036, 'samples': 2402112, 'steps': 12510, 'loss/train': 1.6733269691467285} +11/06/2021 22:58:42 - INFO - __main__ - Step 12518: {'lr': 0.0004937960879750578, 'samples': 2403456, 'steps': 12517, 'loss/train': 1.5596864223480225} +11/06/2021 22:58:44 - INFO - __main__ - Step 12522: {'lr': 0.0004937913875623605, 'samples': 2404224, 'steps': 12521, 'loss/train': 1.12235426902771}5} +11/06/2021 22:58:46 - INFO - __main__ - Step 12527: {'lr': 0.0004937855095748985, 'samples': 2405184, 'steps': 12526, 'loss/train': 1.8808726072311401} +11/06/2021 22:58:46 - INFO - __main__ - Step 12527: {'lr': 0.0004937855095748985, 'samples': 2405184, 'steps': 12526, 'loss/train': 1.8808726072311401} +11/06/2021 22:58:50 - INFO - __main__ - Step 12534: {'lr': 0.0004937772757789352, 'samples': 2406528, 'steps': 12533, 'loss/train': 0.9707418084144592} +11/06/2021 22:58:52 - INFO - __main__ - Step 12538: {'lr': 0.0004937725683361286, 'samples': 2407296, 'steps': 12537, 'loss/train': 1.6391980648040771} +11/06/2021 22:58:54 - INFO - __main__ - Step 12543: {'lr': 0.0004937666815612207, 'samples': 2408256, 'steps': 12542, 'loss/train': 1.523587703704834}} +11/06/2021 22:58:56 - INFO - __main__ - Step 12547: {'lr': 0.0004937619701642162, 'samples': 2409024, 'steps': 12546, 'loss/train': 2.321528434753418}} +11/06/2021 22:58:58 - INFO - __main__ - Step 12551: {'lr': 0.0004937572570098455, 'samples': 2409792, 'steps': 12550, 'loss/train': 1.5153863430023193} +11/06/2021 22:59:00 - INFO - __main__ - Step 12555: {'lr': 0.0004937525420981428, 'samples': 2410560, 'steps': 12554, 'loss/train': 2.261537790298462}} +11/06/2021 22:59:02 - INFO - __main__ - Step 12559: {'lr': 0.0004937478254291418, 'samples': 2411328, 'steps': 12558, 'loss/train': 1.6904947757720947} +11/06/2021 22:59:04 - INFO - __main__ - Step 12564: {'lr': 0.0004937419271217419, 'samples': 2412288, 'steps': 12563, 'loss/train': 5.857589244842529}} +11/06/2021 22:59:06 - INFO - __main__ - Step 12568: {'lr': 0.0004937372064989445, 'samples': 2413056, 'steps': 12567, 'loss/train': 1.3068746328353882} +11/06/2021 22:59:08 - INFO - __main__ - Step 12572: {'lr': 0.0004937324841189595, 'samples': 2413824, 'steps': 12571, 'loss/train': 1.9527837038040161} +11/06/2021 22:59:10 - INFO - __main__ - Step 12576: {'lr': 0.000493727759981821, 'samples': 2414592, 'steps': 12575, 'loss/train': 1.5525745153427124}} +11/06/2021 22:59:12 - INFO - __main__ - Step 12580: {'lr': 0.000493723034087563, 'samples': 2415360, 'steps': 12579, 'loss/train': 0.8102706074714661}} +11/06/2021 22:59:14 - INFO - __main__ - Step 12584: {'lr': 0.0004937183064362196, 'samples': 2416128, 'steps': 12583, 'loss/train': 1.7389198541641235} +11/06/2021 22:59:16 - INFO - __main__ - Step 12588: {'lr': 0.0004937135770278248, 'samples': 2416896, 'steps': 12587, 'loss/train': 1.688107967376709}} +11/06/2021 22:59:18 - INFO - __main__ - Step 12592: {'lr': 0.0004937088458624128, 'samples': 2417664, 'steps': 12591, 'loss/train': 1.8203307390213013} +11/06/2021 22:59:20 - INFO - __main__ - Step 12596: {'lr': 0.0004937041129400177, 'samples': 2418432, 'steps': 12595, 'loss/train': 2.0309805870056152} +11/06/2021 22:59:22 - INFO - __main__ - Step 12601: {'lr': 0.0004936981943163182, 'samples': 2419392, 'steps': 12600, 'loss/train': 1.7093287706375122} +11/06/2021 22:59:24 - INFO - __main__ - Step 12605: {'lr': 0.000493693457440836, 'samples': 2420160, 'steps': 12604, 'loss/train': 2.0806899070739746}} +11/06/2021 22:59:26 - INFO - __main__ - Step 12609: {'lr': 0.0004936887188084813, 'samples': 2420928, 'steps': 12608, 'loss/train': 1.5434484481811523} +11/06/2021 22:59:28 - INFO - __main__ - Step 12613: {'lr': 0.0004936839784192888, 'samples': 2421696, 'steps': 12612, 'loss/train': 1.6676959991455078} +11/06/2021 22:59:30 - INFO - __main__ - Step 12617: {'lr': 0.0004936792362732924, 'samples': 2422464, 'steps': 12616, 'loss/train': 1.7673671245574951} +11/06/2021 22:59:32 - INFO - __main__ - Step 12622: {'lr': 0.0004936733061203435, 'samples': 2423424, 'steps': 12621, 'loss/train': 1.8702856302261353} +11/06/2021 22:59:34 - INFO - __main__ - Step 12626: {'lr': 0.0004936685600216635, 'samples': 2424192, 'steps': 12625, 'loss/train': 1.8777118921279907} +11/06/2021 22:59:34 - INFO - __main__ - Step 12626: {'lr': 0.0004936685600216635, 'samples': 2424192, 'steps': 12625, 'loss/train': 1.8777118921279907} +11/06/2021 22:59:38 - INFO - __main__ - Step 12633: {'lr': 0.0004936602501219522, 'samples': 2425536, 'steps': 12632, 'loss/train': 1.7763961553573608} +11/06/2021 22:59:40 - INFO - __main__ - Step 12638: {'lr': 0.0004936543111856041, 'samples': 2426496, 'steps': 12637, 'loss/train': 1.6684590578079224} +11/06/2021 22:59:40 - INFO - __main__ - Step 12638: {'lr': 0.0004936543111856041, 'samples': 2426496, 'steps': 12637, 'loss/train': 1.6684590578079224} +11/06/2021 22:59:44 - INFO - __main__ - Step 12646: {'lr': 0.0004936448031785576, 'samples': 2428032, 'steps': 12645, 'loss/train': 1.5351349115371704} +11/06/2021 22:59:47 - INFO - __main__ - Step 12650: {'lr': 0.0004936400465402351, 'samples': 2428800, 'steps': 12649, 'loss/train': 1.8610800504684448} +11/06/2021 22:59:48 - INFO - __main__ - Step 12654: {'lr': 0.0004936352881454256, 'samples': 2429568, 'steps': 12653, 'loss/train': 1.6259452104568481} +11/06/2021 22:59:50 - INFO - __main__ - Step 12658: {'lr': 0.000493630527994163, 'samples': 2430336, 'steps': 12657, 'loss/train': 1.9009116888046265}} +11/06/2021 22:59:53 - INFO - __main__ - Step 12663: {'lr': 0.0004936245753351256, 'samples': 2431296, 'steps': 12662, 'loss/train': 1.9647890329360962} +11/06/2021 22:59:55 - INFO - __main__ - Step 12667: {'lr': 0.0004936198112319698, 'samples': 2432064, 'steps': 12666, 'loss/train': 1.6497493982315063} +11/06/2021 22:59:55 - INFO - __main__ - Step 12667: {'lr': 0.0004936198112319698, 'samples': 2432064, 'steps': 12666, 'loss/train': 1.6497493982315063} +11/06/2021 22:59:58 - INFO - __main__ - Step 12674: {'lr': 0.0004936114698252717, 'samples': 2433408, 'steps': 12673, 'loss/train': 1.5145035982131958} +11/06/2021 23:00:00 - INFO - __main__ - Step 12679: {'lr': 0.0004936055083845924, 'samples': 2434368, 'steps': 12678, 'loss/train': 1.7321808338165283} +11/06/2021 23:00:03 - INFO - __main__ - Step 12683: {'lr': 0.0004936007372562778, 'samples': 2435136, 'steps': 12682, 'loss/train': 1.703395128250122}} +11/06/2021 23:00:05 - INFO - __main__ - Step 12687: {'lr': 0.0004935959643717595, 'samples': 2435904, 'steps': 12686, 'loss/train': 1.3232539892196655} +11/06/2021 23:00:07 - INFO - __main__ - Step 12691: {'lr': 0.0004935911897310719, 'samples': 2436672, 'steps': 12690, 'loss/train': 1.8013556003570557} +11/06/2021 23:00:08 - INFO - __main__ - Step 12695: {'lr': 0.0004935864133342495, 'samples': 2437440, 'steps': 12694, 'loss/train': 1.6431411504745483} +11/06/2021 23:00:10 - INFO - __main__ - Step 12699: {'lr': 0.0004935816351813265, 'samples': 2438208, 'steps': 12698, 'loss/train': 1.92881441116333}3} +11/06/2021 23:00:13 - INFO - __main__ - Step 12704: {'lr': 0.000493575660020709, 'samples': 2439168, 'steps': 12703, 'loss/train': 1.6965235471725464}} +11/06/2021 23:00:15 - INFO - __main__ - Step 12708: {'lr': 0.0004935708779166859, 'samples': 2439936, 'steps': 12707, 'loss/train': 1.2805671691894531} +11/06/2021 23:00:17 - INFO - __main__ - Step 12712: {'lr': 0.0004935660940566744, 'samples': 2440704, 'steps': 12711, 'loss/train': 1.640486240386963}} +11/06/2021 23:00:18 - INFO - __main__ - Step 12716: {'lr': 0.000493561308440709, 'samples': 2441472, 'steps': 12715, 'loss/train': 1.336901068687439}}} +11/06/2021 23:00:20 - INFO - __main__ - Step 12720: {'lr': 0.000493556521068824, 'samples': 2442240, 'steps': 12719, 'loss/train': 1.883273720741272}}} +11/06/2021 23:00:23 - INFO - __main__ - Step 12725: {'lr': 0.0004935505343847586, 'samples': 2443200, 'steps': 12724, 'loss/train': 1.665300965309143}} +11/06/2021 23:00:25 - INFO - __main__ - Step 12729: {'lr': 0.000493545743062181, 'samples': 2443968, 'steps': 12728, 'loss/train': 1.831040382385254}}} +11/06/2021 23:00:27 - INFO - __main__ - Step 12733: {'lr': 0.0004935409499837962, 'samples': 2444736, 'steps': 12732, 'loss/train': 2.449708938598633}} +11/06/2021 23:00:28 - INFO - __main__ - Step 12737: {'lr': 0.0004935361551496387, 'samples': 2445504, 'steps': 12736, 'loss/train': 1.5406252145767212} +11/06/2021 23:00:30 - INFO - __main__ - Step 12741: {'lr': 0.000493531358559743, 'samples': 2446272, 'steps': 12740, 'loss/train': 1.849948525428772}2} +11/06/2021 23:00:33 - INFO - __main__ - Step 12746: {'lr': 0.0004935253603534193, 'samples': 2447232, 'steps': 12745, 'loss/train': 1.745668649673462}} +11/06/2021 23:00:35 - INFO - __main__ - Step 12750: {'lr': 0.0004935205598132393, 'samples': 2448000, 'steps': 12749, 'loss/train': 1.637121319770813}} +11/06/2021 23:00:37 - INFO - __main__ - Step 12754: {'lr': 0.0004935157575174336, 'samples': 2448768, 'steps': 12753, 'loss/train': 1.7007369995117188} +11/06/2021 23:00:39 - INFO - __main__ - Step 12758: {'lr': 0.0004935109534660368, 'samples': 2449536, 'steps': 12757, 'loss/train': 1.8127813339233398} +11/06/2021 23:00:40 - INFO - __main__ - Step 12762: {'lr': 0.0004935061476590835, 'samples': 2450304, 'steps': 12761, 'loss/train': 0.9896982908248901} +11/06/2021 23:00:43 - INFO - __main__ - Step 12767: {'lr': 0.0004935001379316935, 'samples': 2451264, 'steps': 12766, 'loss/train': 1.5596141815185547} +11/06/2021 23:00:43 - INFO - __main__ - Step 12767: {'lr': 0.0004935001379316935, 'samples': 2451264, 'steps': 12766, 'loss/train': 1.5596141815185547} +11/06/2021 23:00:43 - INFO - __main__ - Step 12767: {'lr': 0.0004935001379316935, 'samples': 2451264, 'steps': 12766, 'loss/train': 1.5596141815185547} +11/06/2021 23:00:48 - INFO - __main__ - Step 12778: {'lr': 0.0004934869068763992, 'samples': 2453376, 'steps': 12777, 'loss/train': 1.8732150793075562} +11/06/2021 23:00:51 - INFO - __main__ - Step 12783: {'lr': 0.0004934808883718553, 'samples': 2454336, 'steps': 12782, 'loss/train': 1.3475416898727417} +11/06/2021 23:00:53 - INFO - __main__ - Step 12787: {'lr': 0.0004934760715934597, 'samples': 2455104, 'steps': 12786, 'loss/train': 1.5334937572479248} +11/06/2021 23:00:55 - INFO - __main__ - Step 12792: {'lr': 0.0004934700481520717, 'samples': 2456064, 'steps': 12791, 'loss/train': 1.9511923789978027} +11/06/2021 23:00:55 - INFO - __main__ - Step 12792: {'lr': 0.0004934700481520717, 'samples': 2456064, 'steps': 12791, 'loss/train': 1.9511923789978027} +11/06/2021 23:00:59 - INFO - __main__ - Step 12799: {'lr': 0.0004934616107265821, 'samples': 2457408, 'steps': 12798, 'loss/train': 2.198434591293335}} +11/06/2021 23:01:00 - INFO - __main__ - Step 12803: {'lr': 0.0004934567869271751, 'samples': 2458176, 'steps': 12802, 'loss/train': 1.9801455736160278} +11/06/2021 23:01:03 - INFO - __main__ - Step 12808: {'lr': 0.0004934507547097183, 'samples': 2459136, 'steps': 12807, 'loss/train': 1.6593072414398193} +11/06/2021 23:01:05 - INFO - __main__ - Step 12812: {'lr': 0.000493445926961237, 'samples': 2459904, 'steps': 12811, 'loss/train': 1.6957072019577026}} +11/06/2021 23:01:07 - INFO - __main__ - Step 12816: {'lr': 0.0004934410974576679, 'samples': 2460672, 'steps': 12815, 'loss/train': 1.9368259906768799} +11/06/2021 23:01:09 - INFO - __main__ - Step 12820: {'lr': 0.000493436266199046, 'samples': 2461440, 'steps': 12819, 'loss/train': 1.4729948043823242}} +11/06/2021 23:01:10 - INFO - __main__ - Step 12824: {'lr': 0.0004934314331854061, 'samples': 2462208, 'steps': 12823, 'loss/train': 1.826889157295227}} +11/06/2021 23:01:13 - INFO - __main__ - Step 12828: {'lr': 0.000493426598416783, 'samples': 2462976, 'steps': 12827, 'loss/train': 1.77826988697052}7}} +11/06/2021 23:01:15 - INFO - __main__ - Step 12833: {'lr': 0.0004934205524881123, 'samples': 2463936, 'steps': 12832, 'loss/train': 1.9681713581085205} +11/06/2021 23:01:15 - INFO - __main__ - Step 12833: {'lr': 0.0004934205524881123, 'samples': 2463936, 'steps': 12832, 'loss/train': 1.9681713581085205} +11/06/2021 23:01:18 - INFO - __main__ - Step 12838: {'lr': 0.0004934145038174028, 'samples': 2464896, 'steps': 12837, 'loss/train': 1.6767199039459229} +11/06/2021 23:01:21 - INFO - __main__ - Step 12844: {'lr': 0.0004934072417931564, 'samples': 2466048, 'steps': 12843, 'loss/train': 1.7585923671722412} +11/06/2021 23:01:23 - INFO - __main__ - Step 12848: {'lr': 0.0004934023982501406, 'samples': 2466816, 'steps': 12847, 'loss/train': 1.2807785272598267} +11/06/2021 23:01:25 - INFO - __main__ - Step 12852: {'lr': 0.0004933975529523511, 'samples': 2467584, 'steps': 12851, 'loss/train': 1.6571444272994995} +11/06/2021 23:01:27 - INFO - __main__ - Step 12856: {'lr': 0.0004933927058998226, 'samples': 2468352, 'steps': 12855, 'loss/train': 1.74991774559021}5} +11/06/2021 23:01:29 - INFO - __main__ - Step 12861: {'lr': 0.0004933866446166136, 'samples': 2469312, 'steps': 12860, 'loss/train': 1.84537935256958}5} +11/06/2021 23:01:29 - INFO - __main__ - Step 12861: {'lr': 0.0004933866446166136, 'samples': 2469312, 'steps': 12860, 'loss/train': 1.84537935256958}5} +11/06/2021 23:01:32 - INFO - __main__ - Step 12868: {'lr': 0.0004933781542141532, 'samples': 2470656, 'steps': 12867, 'loss/train': 1.985740303993225}} +11/06/2021 23:01:35 - INFO - __main__ - Step 12872: {'lr': 0.0004933733001430186, 'samples': 2471424, 'steps': 12871, 'loss/train': 1.7198106050491333} +11/06/2021 23:01:37 - INFO - __main__ - Step 12877: {'lr': 0.0004933672300867488, 'samples': 2472384, 'steps': 12876, 'loss/train': 1.5705578327178955} +11/06/2021 23:01:39 - INFO - __main__ - Step 12881: {'lr': 0.0004933623720678944, 'samples': 2473152, 'steps': 12880, 'loss/train': 1.816332459449768}} +11/06/2021 23:01:41 - INFO - __main__ - Step 12885: {'lr': 0.0004933575122945547, 'samples': 2473920, 'steps': 12884, 'loss/train': 1.8801758289337158} +11/06/2021 23:01:43 - INFO - __main__ - Step 12889: {'lr': 0.0004933526507667648, 'samples': 2474688, 'steps': 12888, 'loss/train': 2.223954200744629}} +11/06/2021 23:01:45 - INFO - __main__ - Step 12893: {'lr': 0.0004933477874845595, 'samples': 2475456, 'steps': 12892, 'loss/train': 1.9039117097854614} +11/06/2021 23:01:47 - INFO - __main__ - Step 12897: {'lr': 0.0004933429224479743, 'samples': 2476224, 'steps': 12896, 'loss/train': 1.6877235174179077} +11/06/2021 23:01:47 - INFO - __main__ - Step 12897: {'lr': 0.0004933429224479743, 'samples': 2476224, 'steps': 12896, 'loss/train': 1.6877235174179077} +11/06/2021 23:01:51 - INFO - __main__ - Step 12903: {'lr': 0.0004933356216037104, 'samples': 2477376, 'steps': 12902, 'loss/train': 1.398972749710083}} +11/06/2021 23:01:53 - INFO - __main__ - Step 12908: {'lr': 0.0004933295345516287, 'samples': 2478336, 'steps': 12907, 'loss/train': 1.5094048976898193} +11/06/2021 23:01:55 - INFO - __main__ - Step 12913: {'lr': 0.0004933234447585337, 'samples': 2479296, 'steps': 12912, 'loss/train': 1.6900960206985474} +11/06/2021 23:01:55 - INFO - __main__ - Step 12913: {'lr': 0.0004933234447585337, 'samples': 2479296, 'steps': 12912, 'loss/train': 1.6900960206985474} +11/06/2021 23:01:55 - INFO - __main__ - Step 12913: {'lr': 0.0004933234447585337, 'samples': 2479296, 'steps': 12912, 'loss/train': 1.6900960206985474} +11/06/2021 23:02:01 - INFO - __main__ - Step 12923: {'lr': 0.000493311256949578, 'samples': 2481216, 'steps': 12922, 'loss/train': 1.5766397714614868}} +11/06/2021 23:02:03 - INFO - __main__ - Step 12928: {'lr': 0.0004933051589338547, 'samples': 2482176, 'steps': 12927, 'loss/train': 1.815047025680542}} +11/06/2021 23:02:03 - INFO - __main__ - Step 12928: {'lr': 0.0004933051589338547, 'samples': 2482176, 'steps': 12927, 'loss/train': 1.815047025680542}} +11/06/2021 23:02:07 - INFO - __main__ - Step 12936: {'lr': 0.0004932953964079893, 'samples': 2483712, 'steps': 12935, 'loss/train': 1.569036841392517}} +11/06/2021 23:02:09 - INFO - __main__ - Step 12940: {'lr': 0.0004932905125140354, 'samples': 2484480, 'steps': 12939, 'loss/train': 1.5175234079360962} +11/06/2021 23:02:11 - INFO - __main__ - Step 12944: {'lr': 0.0004932856268661143, 'samples': 2485248, 'steps': 12943, 'loss/train': 1.5122387409210205} +11/06/2021 23:02:13 - INFO - __main__ - Step 12949: {'lr': 0.0004932795173397501, 'samples': 2486208, 'steps': 12948, 'loss/train': 2.574796199798584}} +11/06/2021 23:02:16 - INFO - __main__ - Step 12954: {'lr': 0.0004932734050729362, 'samples': 2487168, 'steps': 12953, 'loss/train': 1.2582000494003296} +11/06/2021 23:02:18 - INFO - __main__ - Step 12958: {'lr': 0.0004932685132864072, 'samples': 2487936, 'steps': 12957, 'loss/train': 1.3571699857711792} +11/06/2021 23:02:18 - INFO - __main__ - Step 12958: {'lr': 0.0004932685132864072, 'samples': 2487936, 'steps': 12957, 'loss/train': 1.3571699857711792} +11/06/2021 23:02:21 - INFO - __main__ - Step 12965: {'lr': 0.000493259948439901, 'samples': 2489280, 'steps': 12964, 'loss/train': 1.8154479265213013}} +11/06/2021 23:02:23 - INFO - __main__ - Step 12970: {'lr': 0.0004932538274041101, 'samples': 2490240, 'steps': 12969, 'loss/train': 1.741576910018921}} +11/06/2021 23:02:23 - INFO - __main__ - Step 12970: {'lr': 0.0004932538274041101, 'samples': 2490240, 'steps': 12969, 'loss/train': 1.741576910018921}} +11/06/2021 23:02:27 - INFO - __main__ - Step 12977: {'lr': 0.0004932452533505486, 'samples': 2491584, 'steps': 12976, 'loss/train': 1.471701979637146}} +11/06/2021 23:02:29 - INFO - __main__ - Step 12982: {'lr': 0.0004932391257384883, 'samples': 2492544, 'steps': 12981, 'loss/train': 1.9861183166503906} +11/06/2021 23:02:32 - INFO - __main__ - Step 12987: {'lr': 0.0004932329953864331, 'samples': 2493504, 'steps': 12986, 'loss/train': 1.9840530157089233} +11/06/2021 23:02:32 - INFO - __main__ - Step 12987: {'lr': 0.0004932329953864331, 'samples': 2493504, 'steps': 12986, 'loss/train': 1.9840530157089233} +11/06/2021 23:02:36 - INFO - __main__ - Step 12994: {'lr': 0.0004932244082904959, 'samples': 2494848, 'steps': 12993, 'loss/train': 1.4867180585861206} +11/06/2021 23:02:37 - INFO - __main__ - Step 12998: {'lr': 0.00049321949896747, 'samples': 2495616, 'steps': 12997, 'loss/train': 1.4822603464126587}6} +11/06/2021 23:02:40 - INFO - __main__ - Step 13002: {'lr': 0.0004932145878909889, 'samples': 2496384, 'steps': 13001, 'loss/train': 1.9297839403152466} +11/06/2021 23:02:42 - INFO - __main__ - Step 13006: {'lr': 0.0004932096750610879, 'samples': 2497152, 'steps': 13005, 'loss/train': 1.8479753732681274} +11/06/2021 23:02:42 - INFO - __main__ - Step 13006: {'lr': 0.0004932096750610879, 'samples': 2497152, 'steps': 13005, 'loss/train': 1.8479753732681274} +11/06/2021 23:02:45 - INFO - __main__ - Step 13013: {'lr': 0.0004932010733897012, 'samples': 2498496, 'steps': 13012, 'loss/train': 1.5579228401184082} +11/06/2021 23:02:48 - INFO - __main__ - Step 13018: {'lr': 0.00049319492605122, 'samples': 2499456, 'steps': 13017, 'loss/train': 1.8722537755966187}2} +11/06/2021 23:02:50 - INFO - __main__ - Step 13022: {'lr': 0.000493190006207994, 'samples': 2500224, 'steps': 13021, 'loss/train': 1.3083375692367554}} +11/06/2021 23:02:52 - INFO - __main__ - Step 13026: {'lr': 0.0004931850846115253, 'samples': 2500992, 'steps': 13025, 'loss/train': 1.7009488344192505} +11/06/2021 23:02:53 - INFO - __main__ - Step 13030: {'lr': 0.0004931801612618494, 'samples': 2501760, 'steps': 13029, 'loss/train': 0.9826458692550659} +11/06/2021 23:02:56 - INFO - __main__ - Step 13034: {'lr': 0.000493175236159002, 'samples': 2502528, 'steps': 13033, 'loss/train': 2.120985269546509}9} +11/06/2021 23:02:58 - INFO - __main__ - Step 13039: {'lr': 0.0004931690773150991, 'samples': 2503488, 'steps': 13038, 'loss/train': 1.3863145112991333} +11/06/2021 23:02:58 - INFO - __main__ - Step 13039: {'lr': 0.0004931690773150991, 'samples': 2503488, 'steps': 13038, 'loss/train': 1.3863145112991333} +11/06/2021 23:03:02 - INFO - __main__ - Step 13046: {'lr': 0.0004931604503317846, 'samples': 2504832, 'steps': 13045, 'loss/train': 1.6171785593032837} +11/06/2021 23:03:04 - INFO - __main__ - Step 13051: {'lr': 0.0004931542849139044, 'samples': 2505792, 'steps': 13050, 'loss/train': 2.8212499618530273} +11/06/2021 23:03:06 - INFO - __main__ - Step 13055: {'lr': 0.0004931493506074886, 'samples': 2506560, 'steps': 13054, 'loss/train': 1.271149754524231}} +11/06/2021 23:03:08 - INFO - __main__ - Step 13059: {'lr': 0.0004931444145481233, 'samples': 2507328, 'steps': 13058, 'loss/train': 1.3444815874099731} +11/06/2021 23:03:10 - INFO - __main__ - Step 13063: {'lr': 0.000493139476735844, 'samples': 2508096, 'steps': 13062, 'loss/train': 2.6808207035064697}} +11/06/2021 23:03:10 - INFO - __main__ - Step 13063: {'lr': 0.000493139476735844, 'samples': 2508096, 'steps': 13062, 'loss/train': 2.6808207035064697}} +11/06/2021 23:03:13 - INFO - __main__ - Step 13070: {'lr': 0.0004931308313465132, 'samples': 2509440, 'steps': 13069, 'loss/train': 1.9141942262649536} +11/06/2021 23:03:16 - INFO - __main__ - Step 13075: {'lr': 0.0004931246527818785, 'samples': 2510400, 'steps': 13074, 'loss/train': 1.26536226272583}6} +11/06/2021 23:03:18 - INFO - __main__ - Step 13080: {'lr': 0.0004931184714785385, 'samples': 2511360, 'steps': 13079, 'loss/train': 1.9777021408081055} +11/06/2021 23:03:18 - INFO - __main__ - Step 13080: {'lr': 0.0004931184714785385, 'samples': 2511360, 'steps': 13079, 'loss/train': 1.9777021408081055} +11/06/2021 23:03:22 - INFO - __main__ - Step 13087: {'lr': 0.0004931098130529699, 'samples': 2512704, 'steps': 13086, 'loss/train': 2.025705099105835}} +11/06/2021 23:03:23 - INFO - __main__ - Step 13091: {'lr': 0.0004931048629712905, 'samples': 2513472, 'steps': 13090, 'loss/train': 1.8698866367340088} +11/06/2021 23:03:25 - INFO - __main__ - Step 13095: {'lr': 0.0004930999111369824, 'samples': 2514240, 'steps': 13094, 'loss/train': 1.6571738719940186} +11/06/2021 23:03:25 - INFO - __main__ - Step 13095: {'lr': 0.0004930999111369824, 'samples': 2514240, 'steps': 13094, 'loss/train': 1.6571738719940186} +11/06/2021 23:03:30 - INFO - __main__ - Step 13104: {'lr': 0.0004930887631019248, 'samples': 2515968, 'steps': 13103, 'loss/train': 1.3024754524230957} +11/06/2021 23:03:32 - INFO - __main__ - Step 13109: {'lr': 0.0004930825659154674, 'samples': 2516928, 'steps': 13108, 'loss/train': 0.959062397480011}} +11/06/2021 23:03:32 - INFO - __main__ - Step 13109: {'lr': 0.0004930825659154674, 'samples': 2516928, 'steps': 13108, 'loss/train': 0.959062397480011}} +11/06/2021 23:03:35 - INFO - __main__ - Step 13116: {'lr': 0.0004930738852542141, 'samples': 2518272, 'steps': 13115, 'loss/train': 1.4143397808074951} +11/06/2021 23:03:38 - INFO - __main__ - Step 13121: {'lr': 0.0004930676814961189, 'samples': 2519232, 'steps': 13120, 'loss/train': 1.5763609409332275} +11/06/2021 23:03:38 - INFO - __main__ - Step 13121: {'lr': 0.0004930676814961189, 'samples': 2519232, 'steps': 13120, 'loss/train': 1.5763609409332275} +11/06/2021 23:03:42 - INFO - __main__ - Step 13127: {'lr': 0.0004930602333721667, 'samples': 2520384, 'steps': 13126, 'loss/train': 1.6020070314407349} +11/06/2021 23:03:44 - INFO - __main__ - Step 13133: {'lr': 0.0004930527813055237, 'samples': 2521536, 'steps': 13132, 'loss/train': 2.1043529510498047} +11/06/2021 23:03:44 - INFO - __main__ - Step 13133: {'lr': 0.0004930527813055237, 'samples': 2521536, 'steps': 13132, 'loss/train': 2.1043529510498047} +11/06/2021 23:03:48 - INFO - __main__ - Step 13140: {'lr': 0.0004930440822448115, 'samples': 2522880, 'steps': 13139, 'loss/train': 1.4115676879882812} +11/06/2021 23:03:50 - INFO - __main__ - Step 13144: {'lr': 0.0004930391089437017, 'samples': 2523648, 'steps': 13143, 'loss/train': 1.7475541830062866} +11/06/2021 23:03:52 - INFO - __main__ - Step 13148: {'lr': 0.0004930341338904371, 'samples': 2524416, 'steps': 13147, 'loss/train': 1.889960765838623}} +11/06/2021 23:03:52 - INFO - __main__ - Step 13148: {'lr': 0.0004930341338904371, 'samples': 2524416, 'steps': 13147, 'loss/train': 1.889960765838623}} +11/06/2021 23:03:56 - INFO - __main__ - Step 13156: {'lr': 0.000493024178527587, 'samples': 2525952, 'steps': 13155, 'loss/train': 2.2869997024536133}} +11/06/2021 23:03:57 - INFO - __main__ - Step 13160: {'lr': 0.0004930191982180734, 'samples': 2526720, 'steps': 13159, 'loss/train': 1.5737640857696533} +11/06/2021 23:03:59 - INFO - __main__ - Step 13164: {'lr': 0.0004930142161565486, 'samples': 2527488, 'steps': 13163, 'loss/train': 2.0381977558135986} +11/06/2021 23:04:02 - INFO - __main__ - Step 13169: {'lr': 0.0004930079861159315, 'samples': 2528448, 'steps': 13168, 'loss/train': 1.3868030309677124} +11/06/2021 23:04:04 - INFO - __main__ - Step 13174: {'lr': 0.000493001753337923, 'samples': 2529408, 'steps': 13173, 'loss/train': 1.542048692703247}4} +11/06/2021 23:04:04 - INFO - __main__ - Step 13174: {'lr': 0.000493001753337923, 'samples': 2529408, 'steps': 13173, 'loss/train': 1.542048692703247}4} +11/06/2021 23:04:07 - INFO - __main__ - Step 13181: {'lr': 0.0004929930228500279, 'samples': 2530752, 'steps': 13180, 'loss/train': 1.5887360572814941} +11/06/2021 23:04:10 - INFO - __main__ - Step 13185: {'lr': 0.0004929880315910338, 'samples': 2531520, 'steps': 13184, 'loss/train': 0.39340120553970337} +11/06/2021 23:04:12 - INFO - __main__ - Step 13190: {'lr': 0.0004929817900538455, 'samples': 2532480, 'steps': 13189, 'loss/train': 1.4178115129470825}} +11/06/2021 23:04:12 - INFO - __main__ - Step 13190: {'lr': 0.0004929817900538455, 'samples': 2532480, 'steps': 13189, 'loss/train': 1.4178115129470825}} +11/06/2021 23:04:15 - INFO - __main__ - Step 13197: {'lr': 0.0004929730473034763, 'samples': 2533824, 'steps': 13196, 'loss/train': 1.561155915260315}}} +11/06/2021 23:04:17 - INFO - __main__ - Step 13201: {'lr': 0.000492968049037552, 'samples': 2534592, 'steps': 13200, 'loss/train': 1.2632533311843872}}} +11/06/2021 23:04:20 - INFO - __main__ - Step 13206: {'lr': 0.0004929617987419039, 'samples': 2535552, 'steps': 13205, 'loss/train': 1.9509419202804565}} +11/06/2021 23:04:22 - INFO - __main__ - Step 13210: {'lr': 0.0004929567965348347, 'samples': 2536320, 'steps': 13209, 'loss/train': 1.7661024332046509}} +11/06/2021 23:04:24 - INFO - __main__ - Step 13214: {'lr': 0.0004929517925762045, 'samples': 2537088, 'steps': 13213, 'loss/train': 1.7152559757232666}} +11/06/2021 23:04:25 - INFO - __main__ - Step 13218: {'lr': 0.0004929467868660487, 'samples': 2537856, 'steps': 13217, 'loss/train': 1.3065961599349976}} +11/06/2021 23:04:28 - INFO - __main__ - Step 13222: {'lr': 0.000492941779404404, 'samples': 2538624, 'steps': 13221, 'loss/train': 1.3217058181762695}}} +11/06/2021 23:04:30 - INFO - __main__ - Step 13227: {'lr': 0.0004929355176143714, 'samples': 2539584, 'steps': 13226, 'loss/train': 1.6296266317367554}} +11/06/2021 23:04:32 - INFO - __main__ - Step 13232: {'lr': 0.0004929292530877638, 'samples': 2540544, 'steps': 13231, 'loss/train': 1.5122207403182983}} +11/06/2021 23:04:32 - INFO - __main__ - Step 13232: {'lr': 0.0004929292530877638, 'samples': 2540544, 'steps': 13231, 'loss/train': 1.5122207403182983}} +11/06/2021 23:04:36 - INFO - __main__ - Step 13239: {'lr': 0.0004929204781532018, 'samples': 2541888, 'steps': 13238, 'loss/train': 1.915743112564087}}} +11/06/2021 23:04:38 - INFO - __main__ - Step 13243: {'lr': 0.0004929154614968315, 'samples': 2542656, 'steps': 13242, 'loss/train': 0.5492236614227295}} +11/06/2021 23:04:40 - INFO - __main__ - Step 13247: {'lr': 0.0004929104430891978, 'samples': 2543424, 'steps': 13246, 'loss/train': 1.5061917304992676}} +11/06/2021 23:04:42 - INFO - __main__ - Step 13252: {'lr': 0.0004929041676169967, 'samples': 2544384, 'steps': 13251, 'loss/train': 1.4510022401809692}} +11/06/2021 23:04:44 - INFO - __main__ - Step 13256: {'lr': 0.0004928991452691528, 'samples': 2545152, 'steps': 13255, 'loss/train': 1.8692861795425415}} +11/06/2021 23:04:44 - INFO - __main__ - Step 13256: {'lr': 0.0004928991452691528, 'samples': 2545152, 'steps': 13255, 'loss/train': 1.8692861795425415}} +11/06/2021 23:04:48 - INFO - __main__ - Step 13263: {'lr': 0.0004928903519467534, 'samples': 2546496, 'steps': 13262, 'loss/train': 2.4009814262390137}} +11/06/2021 23:04:50 - INFO - __main__ - Step 13268: {'lr': 0.0004928840677188918, 'samples': 2547456, 'steps': 13267, 'loss/train': 1.5503804683685303}} +11/06/2021 23:04:50 - INFO - __main__ - Step 13268: {'lr': 0.0004928840677188918, 'samples': 2547456, 'steps': 13267, 'loss/train': 1.5503804683685303}} +11/06/2021 23:04:54 - INFO - __main__ - Step 13276: {'lr': 0.0004928740072634722, 'samples': 2548992, 'steps': 13275, 'loss/train': 2.0685250759124756}} +11/06/2021 23:04:56 - INFO - __main__ - Step 13280: {'lr': 0.0004928689744092976, 'samples': 2549760, 'steps': 13279, 'loss/train': 1.8017091751098633}} +11/06/2021 23:04:58 - INFO - __main__ - Step 13284: {'lr': 0.0004928639398041948, 'samples': 2550528, 'steps': 13283, 'loss/train': 1.974739670753479}}} +11/06/2021 23:05:00 - INFO - __main__ - Step 13288: {'lr': 0.0004928589034482001, 'samples': 2551296, 'steps': 13287, 'loss/train': 1.8625463247299194}} +11/06/2021 23:05:03 - INFO - __main__ - Step 13294: {'lr': 0.0004928513456313653, 'samples': 2552448, 'steps': 13293, 'loss/train': 1.6685292720794678}} +11/06/2021 23:05:03 - INFO - __main__ - Step 13294: {'lr': 0.0004928513456313653, 'samples': 2552448, 'steps': 13293, 'loss/train': 1.6685292720794678}} +11/06/2021 23:05:07 - INFO - __main__ - Step 13301: {'lr': 0.0004928425231995593, 'samples': 2553792, 'steps': 13300, 'loss/train': 1.7554380893707275}} +11/06/2021 23:05:08 - INFO - __main__ - Step 13305: {'lr': 0.0004928374794026792, 'samples': 2554560, 'steps': 13304, 'loss/train': 1.3994184732437134}} +11/06/2021 23:05:10 - INFO - __main__ - Step 13309: {'lr': 0.000492832433855098, 'samples': 2555328, 'steps': 13308, 'loss/train': 1.3893240690231323}}} +11/06/2021 23:05:13 - INFO - __main__ - Step 13314: {'lr': 0.0004928261244587536, 'samples': 2556288, 'steps': 13313, 'loss/train': 1.8624576330184937}} +11/06/2021 23:05:15 - INFO - __main__ - Step 13319: {'lr': 0.0004928198123270664, 'samples': 2557248, 'steps': 13318, 'loss/train': 1.5688247680664062}} +11/06/2021 23:05:15 - INFO - __main__ - Step 13319: {'lr': 0.0004928198123270664, 'samples': 2557248, 'steps': 13318, 'loss/train': 1.5688247680664062}} +11/06/2021 23:05:18 - INFO - __main__ - Step 13326: {'lr': 0.0004928109707474643, 'samples': 2558592, 'steps': 13325, 'loss/train': 1.6393741369247437}} +11/06/2021 23:05:20 - INFO - __main__ - Step 13330: {'lr': 0.0004928059160092993, 'samples': 2559360, 'steps': 13329, 'loss/train': 1.7646552324295044}} +11/06/2021 23:05:23 - INFO - __main__ - Step 13335: {'lr': 0.0004927995951249937, 'samples': 2560320, 'steps': 13334, 'loss/train': 1.3417226076126099}} +11/06/2021 23:05:23 - INFO - __main__ - Step 13335: {'lr': 0.0004927995951249937, 'samples': 2560320, 'steps': 13334, 'loss/train': 1.3417226076126099}} +11/06/2021 23:05:26 - INFO - __main__ - Step 13341: {'lr': 0.0004927920064535756, 'samples': 2561472, 'steps': 13340, 'loss/train': 1.808425784111023}}} +11/06/2021 23:05:28 - INFO - __main__ - Step 13345: {'lr': 0.0004927869451513226, 'samples': 2562240, 'steps': 13344, 'loss/train': 1.5792934894561768}} +11/06/2021 23:05:30 - INFO - __main__ - Step 13350: {'lr': 0.0004927806160620995, 'samples': 2563200, 'steps': 13349, 'loss/train': 2.182821750640869}}} +11/06/2021 23:05:33 - INFO - __main__ - Step 13355: {'lr': 0.0004927742842380465, 'samples': 2564160, 'steps': 13354, 'loss/train': 2.1269948482513428}} +11/06/2021 23:05:33 - INFO - __main__ - Step 13355: {'lr': 0.0004927742842380465, 'samples': 2564160, 'steps': 13354, 'loss/train': 2.1269948482513428}} +11/06/2021 23:05:36 - INFO - __main__ - Step 13362: {'lr': 0.0004927654150899937, 'samples': 2565504, 'steps': 13361, 'loss/train': 2.3916163444519043}} +11/06/2021 23:05:38 - INFO - __main__ - Step 13366: {'lr': 0.0004927603445988797, 'samples': 2566272, 'steps': 13365, 'loss/train': 1.918675422668457}}} +11/06/2021 23:05:40 - INFO - __main__ - Step 13370: {'lr': 0.0004927552723576207, 'samples': 2567040, 'steps': 13369, 'loss/train': 1.939740777015686}}} +11/06/2021 23:05:42 - INFO - __main__ - Step 13375: {'lr': 0.0004927489295949613, 'samples': 2568000, 'steps': 13374, 'loss/train': 1.403855562210083}}} +11/06/2021 23:05:42 - INFO - __main__ - Step 13375: {'lr': 0.0004927489295949613, 'samples': 2568000, 'steps': 13374, 'loss/train': 1.403855562210083}}} +11/06/2021 23:05:46 - INFO - __main__ - Step 13383: {'lr': 0.0004927387754870321, 'samples': 2569536, 'steps': 13382, 'loss/train': 0.35177692770957947} +11/06/2021 23:05:48 - INFO - __main__ - Step 13387: {'lr': 0.0004927336958080648, 'samples': 2570304, 'steps': 13386, 'loss/train': 1.88877272605896}47} +11/06/2021 23:05:50 - INFO - __main__ - Step 13391: {'lr': 0.0004927286143791447, 'samples': 2571072, 'steps': 13390, 'loss/train': 2.0183682441711426}} +11/06/2021 23:05:52 - INFO - __main__ - Step 13396: {'lr': 0.0004927222601321789, 'samples': 2572032, 'steps': 13395, 'loss/train': 2.6536405086517334}} +11/06/2021 23:05:52 - INFO - __main__ - Step 13396: {'lr': 0.0004927222601321789, 'samples': 2572032, 'steps': 13395, 'loss/train': 2.6536405086517334}} +11/06/2021 23:05:57 - INFO - __main__ - Step 13403: {'lr': 0.000492713359593033, 'samples': 2573376, 'steps': 13402, 'loss/train': 1.8210397958755493}}} +11/06/2021 23:05:58 - INFO - __main__ - Step 13407: {'lr': 0.0004927082711646676, 'samples': 2574144, 'steps': 13406, 'loss/train': 1.7488776445388794}} +11/06/2021 23:06:00 - INFO - __main__ - Step 13412: {'lr': 0.0004927019081686015, 'samples': 2575104, 'steps': 13411, 'loss/train': 1.4143866300582886}} +11/06/2021 23:06:02 - INFO - __main__ - Step 13416: {'lr': 0.000492696815803306, 'samples': 2575872, 'steps': 13415, 'loss/train': 1.7381833791732788}}} +11/06/2021 23:06:05 - INFO - __main__ - Step 13420: {'lr': 0.0004926917216883235, 'samples': 2576640, 'steps': 13419, 'loss/train': 1.7219598293304443}} +11/06/2021 23:06:07 - INFO - __main__ - Step 13424: {'lr': 0.0004926866258236907, 'samples': 2577408, 'steps': 13423, 'loss/train': 2.304779529571533}}} +11/06/2021 23:06:08 - INFO - __main__ - Step 13428: {'lr': 0.0004926815282094443, 'samples': 2578176, 'steps': 13427, 'loss/train': 2.2351608276367188}} +11/06/2021 23:06:10 - INFO - __main__ - Step 13432: {'lr': 0.0004926764288456212, 'samples': 2578944, 'steps': 13431, 'loss/train': 1.6883317232131958}} +11/06/2021 23:06:13 - INFO - __main__ - Step 13437: {'lr': 0.0004926700521805557, 'samples': 2579904, 'steps': 13436, 'loss/train': 1.5972094535827637}} +11/06/2021 23:06:15 - INFO - __main__ - Step 13441: {'lr': 0.000492664948880319, 'samples': 2580672, 'steps': 13440, 'loss/train': 1.513269305229187}7}} +11/06/2021 23:06:17 - INFO - __main__ - Step 13445: {'lr': 0.0004926598438306252, 'samples': 2581440, 'steps': 13444, 'loss/train': 1.1700359582901}}7}} +11/06/2021 23:06:17 - INFO - __main__ - Step 13445: {'lr': 0.0004926598438306252, 'samples': 2581440, 'steps': 13444, 'loss/train': 1.1700359582901}}7}} +11/06/2021 23:06:20 - INFO - __main__ - Step 13452: {'lr': 0.0004926509057841397, 'samples': 2582784, 'steps': 13451, 'loss/train': 2.232959032058716}}} +11/06/2021 23:06:23 - INFO - __main__ - Step 13458: {'lr': 0.0004926432403373752, 'samples': 2583936, 'steps': 13457, 'loss/train': 2.219507932662964}}} +11/06/2021 23:06:23 - INFO - __main__ - Step 13458: {'lr': 0.0004926432403373752, 'samples': 2583936, 'steps': 13457, 'loss/train': 2.219507932662964}}} +11/06/2021 23:06:26 - INFO - __main__ - Step 13465: {'lr': 0.0004926342923415844, 'samples': 2585280, 'steps': 13464, 'loss/train': 1.8750228881835938}} +11/06/2021 23:06:28 - INFO - __main__ - Step 13469: {'lr': 0.0004926291767959199, 'samples': 2586048, 'steps': 13468, 'loss/train': 3.767948865890503}}} +11/06/2021 23:06:31 - INFO - __main__ - Step 13474: {'lr': 0.000492622779904032, 'samples': 2587008, 'steps': 13473, 'loss/train': 1.531381368637085}}}} +11/06/2021 23:06:33 - INFO - __main__ - Step 13478: {'lr': 0.0004926176604227208, 'samples': 2587776, 'steps': 13477, 'loss/train': 1.7047059535980225}} +11/06/2021 23:06:33 - INFO - __main__ - Step 13478: {'lr': 0.0004926176604227208, 'samples': 2587776, 'steps': 13477, 'loss/train': 1.7047059535980225}} +11/06/2021 23:06:36 - INFO - __main__ - Step 13485: {'lr': 0.0004926086971216371, 'samples': 2589120, 'steps': 13484, 'loss/train': 1.7945960760116577}} +11/06/2021 23:06:36 - INFO - __main__ - Step 13485: {'lr': 0.0004926086971216371, 'samples': 2589120, 'steps': 13484, 'loss/train': 1.7945960760116577}} +11/06/2021 23:06:36 - INFO - __main__ - Step 13485: {'lr': 0.0004926086971216371, 'samples': 2589120, 'steps': 13484, 'loss/train': 1.7945960760116577}} +11/06/2021 23:06:42 - INFO - __main__ - Step 13496: {'lr': 0.0004925946011120382, 'samples': 2591232, 'steps': 13495, 'loss/train': 2.3239166736602783}} +11/06/2021 23:06:44 - INFO - __main__ - Step 13500: {'lr': 0.000492589472011044, 'samples': 2592000, 'steps': 13499, 'loss/train': 2.0992441177368164}}} +11/06/2021 23:06:47 - INFO - __main__ - Step 13505: {'lr': 0.0004925830581753964, 'samples': 2592960, 'steps': 13504, 'loss/train': 2.066511631011963}}} +11/06/2021 23:06:49 - INFO - __main__ - Step 13509: {'lr': 0.0004925779251393995, 'samples': 2593728, 'steps': 13508, 'loss/train': 2.0398895740509033}} +11/06/2021 23:06:51 - INFO - __main__ - Step 13513: {'lr': 0.0004925727903545727, 'samples': 2594496, 'steps': 13512, 'loss/train': 1.662975788116455}}} +11/06/2021 23:06:52 - INFO - __main__ - Step 13517: {'lr': 0.0004925676538209531, 'samples': 2595264, 'steps': 13516, 'loss/train': 2.147181510925293}}} +11/06/2021 23:06:54 - INFO - __main__ - Step 13521: {'lr': 0.0004925625155385775, 'samples': 2596032, 'steps': 13520, 'loss/train': 1.926583170890808}}} +11/06/2021 23:06:57 - INFO - __main__ - Step 13526: {'lr': 0.0004925560902264766, 'samples': 2596992, 'steps': 13525, 'loss/train': 1.8510551452636719}} +11/06/2021 23:06:57 - INFO - __main__ - Step 13526: {'lr': 0.0004925560902264766, 'samples': 2596992, 'steps': 13525, 'loss/train': 1.8510551452636719}} +11/06/2021 23:06:57 - INFO - __main__ - Step 13526: {'lr': 0.0004925560902264766, 'samples': 2596992, 'steps': 13525, 'loss/train': 1.8510551452636719}} +11/06/2021 23:07:02 - INFO - __main__ - Step 13536: {'lr': 0.0004925432314054448, 'samples': 2598912, 'steps': 13535, 'loss/train': 1.898144006729126}}} +11/06/2021 23:07:05 - INFO - __main__ - Step 13541: {'lr': 0.0004925367978966588, 'samples': 2599872, 'steps': 13540, 'loss/train': 2.184403419494629}}} +11/06/2021 23:07:07 - INFO - __main__ - Step 13546: {'lr': 0.0004925303616557893, 'samples': 2600832, 'steps': 13545, 'loss/train': 1.6563913822174072}} +11/06/2021 23:07:09 - INFO - __main__ - Step 13550: {'lr': 0.0004925252106960425, 'samples': 2601600, 'steps': 13549, 'loss/train': 1.596949577331543}}} +11/06/2021 23:07:09 - INFO - __main__ - Step 13550: {'lr': 0.0004925252106960425, 'samples': 2601600, 'steps': 13549, 'loss/train': 1.596949577331543}}} +11/06/2021 23:07:12 - INFO - __main__ - Step 13557: {'lr': 0.0004925161923093001, 'samples': 2602944, 'steps': 13556, 'loss/train': 1.5300875902175903}} +11/06/2021 23:07:15 - INFO - __main__ - Step 13562: {'lr': 0.0004925097473262509, 'samples': 2603904, 'steps': 13561, 'loss/train': 1.773667573928833}}} +11/06/2021 23:07:17 - INFO - __main__ - Step 13567: {'lr': 0.000492503299611423, 'samples': 2604864, 'steps': 13566, 'loss/train': 1.2261930704116821}}} +11/06/2021 23:07:19 - INFO - __main__ - Step 13571: {'lr': 0.0004924981394727288, 'samples': 2605632, 'steps': 13570, 'loss/train': 1.4361501932144165}} +11/06/2021 23:07:19 - INFO - __main__ - Step 13571: {'lr': 0.0004924981394727288, 'samples': 2605632, 'steps': 13570, 'loss/train': 1.4361501932144165}} +11/06/2021 23:07:22 - INFO - __main__ - Step 13578: {'lr': 0.0004924891050232984, 'samples': 2606976, 'steps': 13577, 'loss/train': 1.8606226444244385}} +11/06/2021 23:07:25 - INFO - __main__ - Step 13583: {'lr': 0.0004924826485672667, 'samples': 2607936, 'steps': 13582, 'loss/train': 0.9627843499183655}} +11/06/2021 23:07:27 - INFO - __main__ - Step 13587: {'lr': 0.0004924774814357768, 'samples': 2608704, 'steps': 13586, 'loss/train': 1.7782405614852905}} +11/06/2021 23:07:27 - INFO - __main__ - Step 13587: {'lr': 0.0004924774814357768, 'samples': 2608704, 'steps': 13586, 'loss/train': 1.7782405614852905}} +11/06/2021 23:07:31 - INFO - __main__ - Step 13594: {'lr': 0.0004924684347493126, 'samples': 2610048, 'steps': 13593, 'loss/train': 1.741284966468811}}} +11/06/2021 23:07:33 - INFO - __main__ - Step 13598: {'lr': 0.0004924632628106217, 'samples': 2610816, 'steps': 13597, 'loss/train': 1.9725139141082764}} +11/06/2021 23:07:35 - INFO - __main__ - Step 13604: {'lr': 0.0004924555016250908, 'samples': 2611968, 'steps': 13603, 'loss/train': 1.9242398738861084}} +11/06/2021 23:07:35 - INFO - __main__ - Step 13604: {'lr': 0.0004924555016250908, 'samples': 2611968, 'steps': 13603, 'loss/train': 1.9242398738861084}} +11/06/2021 23:07:39 - INFO - __main__ - Step 13609: {'lr': 0.0004924490309661918, 'samples': 2612928, 'steps': 13608, 'loss/train': 0.6431192755699158}} +11/06/2021 23:07:41 - INFO - __main__ - Step 13614: {'lr': 0.000492442557576198, 'samples': 2613888, 'steps': 13613, 'loss/train': 1.7973626852035522}}} +11/06/2021 23:07:43 - INFO - __main__ - Step 13618: {'lr': 0.0004924373768978638, 'samples': 2614656, 'steps': 13617, 'loss/train': 2.0704801082611084}} +11/06/2021 23:07:45 - INFO - __main__ - Step 13622: {'lr': 0.0004924321944717129, 'samples': 2615424, 'steps': 13621, 'loss/train': 1.9337289333343506}} +11/06/2021 23:07:47 - INFO - __main__ - Step 13626: {'lr': 0.0004924270102977827, 'samples': 2616192, 'steps': 13625, 'loss/train': 2.1077988147735596}} +11/06/2021 23:07:47 - INFO - __main__ - Step 13626: {'lr': 0.0004924270102977827, 'samples': 2616192, 'steps': 13625, 'loss/train': 2.1077988147735596}} +11/06/2021 23:07:51 - INFO - __main__ - Step 13634: {'lr': 0.000492416636706734, 'samples': 2617728, 'steps': 13633, 'loss/train': 1.84334397315979}96}} +11/06/2021 23:07:53 - INFO - __main__ - Step 13638: {'lr': 0.0004924114472896902, 'samples': 2618496, 'steps': 13637, 'loss/train': 1.547655701637268}}} +11/06/2021 23:07:55 - INFO - __main__ - Step 13642: {'lr': 0.0004924062561250167, 'samples': 2619264, 'steps': 13641, 'loss/train': 1.4436631202697754}} +11/06/2021 23:07:57 - INFO - __main__ - Step 13647: {'lr': 0.0004923997647116276, 'samples': 2620224, 'steps': 13646, 'loss/train': 0.61855548620224}4}} +11/06/2021 23:07:57 - INFO - __main__ - Step 13647: {'lr': 0.0004923997647116276, 'samples': 2620224, 'steps': 13646, 'loss/train': 0.61855548620224}4}} +11/06/2021 23:07:57 - INFO - __main__ - Step 13647: {'lr': 0.0004923997647116276, 'samples': 2620224, 'steps': 13646, 'loss/train': 0.61855548620224}4}} +11/06/2021 23:08:02 - INFO - __main__ - Step 13658: {'lr': 0.0004923854739907743, 'samples': 2622336, 'steps': 13657, 'loss/train': 1.2240080833435059}} +11/06/2021 23:08:05 - INFO - __main__ - Step 13663: {'lr': 0.0004923789738399152, 'samples': 2623296, 'steps': 13662, 'loss/train': 1.5047688484191895}} +11/06/2021 23:08:05 - INFO - __main__ - Step 13663: {'lr': 0.0004923789738399152, 'samples': 2623296, 'steps': 13662, 'loss/train': 1.5047688484191895}} +11/06/2021 23:08:09 - INFO - __main__ - Step 13670: {'lr': 0.0004923698690418154, 'samples': 2624640, 'steps': 13669, 'loss/train': 0.9396169781684875}} +11/06/2021 23:08:10 - INFO - __main__ - Step 13674: {'lr': 0.0004923646638974524, 'samples': 2625408, 'steps': 13673, 'loss/train': 1.3942358493804932}} +11/06/2021 23:08:13 - INFO - __main__ - Step 13679: {'lr': 0.0004923581550098733, 'samples': 2626368, 'steps': 13678, 'loss/train': 1.6954731941223145}} +11/06/2021 23:08:15 - INFO - __main__ - Step 13684: {'lr': 0.000492351643392223, 'samples': 2627328, 'steps': 13683, 'loss/train': 2.214824914932251}5}} +11/06/2021 23:08:17 - INFO - __main__ - Step 13688: {'lr': 0.0004923464321325008, 'samples': 2628096, 'steps': 13687, 'loss/train': 2.2057156562805176}} +11/06/2021 23:08:19 - INFO - __main__ - Step 13692: {'lr': 0.0004923412191256176, 'samples': 2628864, 'steps': 13691, 'loss/train': 1.6855508089065552}} +11/06/2021 23:08:21 - INFO - __main__ - Step 13696: {'lr': 0.000492336004371611, 'samples': 2629632, 'steps': 13695, 'loss/train': 1.891566276550293}2}} +11/06/2021 23:08:23 - INFO - __main__ - Step 13700: {'lr': 0.0004923307878705186, 'samples': 2630400, 'steps': 13699, 'loss/train': 1.4887804985046387}} +11/06/2021 23:08:25 - INFO - __main__ - Step 13704: {'lr': 0.000492325569622378, 'samples': 2631168, 'steps': 13703, 'loss/train': 1.5167887210845947}}} +11/06/2021 23:08:25 - INFO - __main__ - Step 13704: {'lr': 0.000492325569622378, 'samples': 2631168, 'steps': 13703, 'loss/train': 1.5167887210845947}}} +11/06/2021 23:08:29 - INFO - __main__ - Step 13712: {'lr': 0.0004923151278851025, 'samples': 2632704, 'steps': 13711, 'loss/train': 0.9735046029090881}} +11/06/2021 23:08:29 - INFO - __main__ - Step 13712: {'lr': 0.0004923151278851025, 'samples': 2632704, 'steps': 13711, 'loss/train': 0.9735046029090881}} +11/06/2021 23:08:33 - INFO - __main__ - Step 13719: {'lr': 0.0004923059856328447, 'samples': 2634048, 'steps': 13718, 'loss/train': 1.5310945510864258}} +11/06/2021 23:08:35 - INFO - __main__ - Step 13724: {'lr': 0.0004922994521772687, 'samples': 2635008, 'steps': 13723, 'loss/train': 1.856695532798767}}} +11/06/2021 23:08:35 - INFO - __main__ - Step 13724: {'lr': 0.0004922994521772687, 'samples': 2635008, 'steps': 13723, 'loss/train': 1.856695532798767}}} +11/06/2021 23:08:35 - INFO - __main__ - Step 13724: {'lr': 0.0004922994521772687, 'samples': 2635008, 'steps': 13723, 'loss/train': 1.856695532798767}}} +11/06/2021 23:08:41 - INFO - __main__ - Step 13735: {'lr': 0.0004922850689675823, 'samples': 2637120, 'steps': 13734, 'loss/train': 0.9880645275115967}} +11/06/2021 23:08:43 - INFO - __main__ - Step 13741: {'lr': 0.000492277218012765, 'samples': 2638272, 'steps': 13740, 'loss/train': 1.6142842769622803}}} +11/06/2021 23:08:43 - INFO - __main__ - Step 13741: {'lr': 0.000492277218012765, 'samples': 2638272, 'steps': 13740, 'loss/train': 1.6142842769622803}}} +11/06/2021 23:08:47 - INFO - __main__ - Step 13748: {'lr': 0.000492268053598417, 'samples': 2639616, 'steps': 13747, 'loss/train': 2.627610445022583}}}} +11/06/2021 23:08:49 - INFO - __main__ - Step 13752: {'lr': 0.0004922628143886358, 'samples': 2640384, 'steps': 13751, 'loss/train': 2.049717903137207}}} +11/06/2021 23:08:51 - INFO - __main__ - Step 13757: {'lr': 0.0004922562629203161, 'samples': 2641344, 'steps': 13756, 'loss/train': 1.271485447883606}}} +11/06/2021 23:08:54 - INFO - __main__ - Step 13762: {'lr': 0.0004922497087230732, 'samples': 2642304, 'steps': 13761, 'loss/train': 1.9483925104141235}} +11/06/2021 23:08:54 - INFO - __main__ - Step 13762: {'lr': 0.0004922497087230732, 'samples': 2642304, 'steps': 13761, 'loss/train': 1.9483925104141235}} +11/06/2021 23:08:58 - INFO - __main__ - Step 13769: {'lr': 0.0004922405282624825, 'samples': 2643648, 'steps': 13768, 'loss/train': 0.8302810788154602}} +11/06/2021 23:08:59 - INFO - __main__ - Step 13773: {'lr': 0.0004922352798836924, 'samples': 2644416, 'steps': 13772, 'loss/train': 2.0496914386749268}} +11/06/2021 23:09:01 - INFO - __main__ - Step 13777: {'lr': 0.0004922300297585428, 'samples': 2645184, 'steps': 13776, 'loss/train': 2.127047061920166}}} +11/06/2021 23:09:04 - INFO - __main__ - Step 13782: {'lr': 0.0004922234646463451, 'samples': 2646144, 'steps': 13781, 'loss/train': 1.9466784000396729}} +11/06/2021 23:09:06 - INFO - __main__ - Step 13786: {'lr': 0.0004922182105920246, 'samples': 2646912, 'steps': 13785, 'loss/train': 1.4474611282348633}} +11/06/2021 23:09:08 - INFO - __main__ - Step 13790: {'lr': 0.0004922129547914675, 'samples': 2647680, 'steps': 13789, 'loss/train': 2.097891330718994}}} +11/06/2021 23:09:09 - INFO - __main__ - Step 13794: {'lr': 0.0004922076972447117, 'samples': 2648448, 'steps': 13793, 'loss/train': 1.157942533493042}}} +11/06/2021 23:09:11 - INFO - __main__ - Step 13798: {'lr': 0.000492202437951795, 'samples': 2649216, 'steps': 13797, 'loss/train': 1.639959454536438}}}} +11/06/2021 23:09:14 - INFO - __main__ - Step 13803: {'lr': 0.0004921958613801683, 'samples': 2650176, 'steps': 13802, 'loss/train': 1.5847387313842773}} +11/06/2021 23:09:16 - INFO - __main__ - Step 13807: {'lr': 0.0004921905981585286, 'samples': 2650944, 'steps': 13806, 'loss/train': 1.3894824981689453}} +11/06/2021 23:09:18 - INFO - __main__ - Step 13811: {'lr': 0.0004921853331908512, 'samples': 2651712, 'steps': 13810, 'loss/train': 1.9072991609573364}} +11/06/2021 23:09:19 - INFO - __main__ - Step 13815: {'lr': 0.0004921800664771743, 'samples': 2652480, 'steps': 13814, 'loss/train': 1.7779452800750732}} +11/06/2021 23:09:21 - INFO - __main__ - Step 13819: {'lr': 0.0004921747980175357, 'samples': 2653248, 'steps': 13818, 'loss/train': 1.8573100566864014}} +11/06/2021 23:09:24 - INFO - __main__ - Step 13824: {'lr': 0.0004921682099877869, 'samples': 2654208, 'steps': 13823, 'loss/train': 1.7149298191070557}} +11/06/2021 23:09:26 - INFO - __main__ - Step 13828: {'lr': 0.0004921629375998736, 'samples': 2654976, 'steps': 13827, 'loss/train': 1.5501351356506348}} +11/06/2021 23:09:28 - INFO - __main__ - Step 13832: {'lr': 0.0004921576634661221, 'samples': 2655744, 'steps': 13831, 'loss/train': 1.670548439025879}}} +11/06/2021 23:09:30 - INFO - __main__ - Step 13836: {'lr': 0.0004921523875865706, 'samples': 2656512, 'steps': 13835, 'loss/train': 1.0246696472167969}} +11/06/2021 23:09:31 - INFO - __main__ - Step 13840: {'lr': 0.0004921471099612571, 'samples': 2657280, 'steps': 13839, 'loss/train': 1.2678571939468384}} +11/06/2021 23:09:33 - INFO - __main__ - Step 13844: {'lr': 0.0004921418305902194, 'samples': 2658048, 'steps': 13843, 'loss/train': 1.7268887758255005}} +11/06/2021 23:09:36 - INFO - __main__ - Step 13849: {'lr': 0.0004921352289215561, 'samples': 2659008, 'steps': 13848, 'loss/train': 1.6378384828567505}} +11/06/2021 23:09:38 - INFO - __main__ - Step 13853: {'lr': 0.0004921299456227785, 'samples': 2659776, 'steps': 13852, 'loss/train': 1.6967663764953613}} +11/06/2021 23:09:38 - INFO - __main__ - Step 13853: {'lr': 0.0004921299456227785, 'samples': 2659776, 'steps': 13852, 'loss/train': 1.6967663764953613}} +11/06/2021 23:09:41 - INFO - __main__ - Step 13860: {'lr': 0.0004921206956495903, 'samples': 2661120, 'steps': 13859, 'loss/train': 0.5547469854354858}} +11/06/2021 23:09:44 - INFO - __main__ - Step 13866: {'lr': 0.0004921127628463972, 'samples': 2662272, 'steps': 13865, 'loss/train': 1.8773669004440308}} +11/06/2021 23:09:46 - INFO - __main__ - Step 13870: {'lr': 0.0004921074721290819, 'samples': 2663040, 'steps': 13869, 'loss/train': 1.8711230754852295}} +11/06/2021 23:09:46 - INFO - __main__ - Step 13870: {'lr': 0.0004921074721290819, 'samples': 2663040, 'steps': 13869, 'loss/train': 1.8711230754852295}} +11/06/2021 23:09:49 - INFO - __main__ - Step 13877: {'lr': 0.000492098209173842, 'samples': 2664384, 'steps': 13876, 'loss/train': 1.0459492206573486}}} +11/06/2021 23:09:51 - INFO - __main__ - Step 13881: {'lr': 0.0004920929136566632, 'samples': 2665152, 'steps': 13880, 'loss/train': 1.556997299194336}}} +11/06/2021 23:09:53 - INFO - __main__ - Step 13885: {'lr': 0.0004920876163941511, 'samples': 2665920, 'steps': 13884, 'loss/train': 1.1255569458007812}} +11/06/2021 23:09:56 - INFO - __main__ - Step 13889: {'lr': 0.0004920823173863439, 'samples': 2666688, 'steps': 13888, 'loss/train': 1.4370955228805542}} +11/06/2021 23:09:57 - INFO - __main__ - Step 13893: {'lr': 0.0004920770166332798, 'samples': 2667456, 'steps': 13892, 'loss/train': 1.972109317779541}}} +11/06/2021 23:10:00 - INFO - __main__ - Step 13898: {'lr': 0.0004920703882377403, 'samples': 2668416, 'steps': 13897, 'loss/train': 1.741361141204834}}} +11/06/2021 23:10:02 - INFO - __main__ - Step 13902: {'lr': 0.000492065083557988, 'samples': 2669184, 'steps': 13901, 'loss/train': 1.932618260383606}}}} +11/06/2021 23:10:02 - INFO - __main__ - Step 13902: {'lr': 0.000492065083557988, 'samples': 2669184, 'steps': 13901, 'loss/train': 1.932618260383606}}}} +11/06/2021 23:10:02 - INFO - __main__ - Step 13902: {'lr': 0.000492065083557988, 'samples': 2669184, 'steps': 13901, 'loss/train': 1.932618260383606}}}} +11/06/2021 23:10:07 - INFO - __main__ - Step 13912: {'lr': 0.0004920518142237352, 'samples': 2671104, 'steps': 13911, 'loss/train': 1.33417809009552}}}} +11/06/2021 23:10:10 - INFO - __main__ - Step 13917: {'lr': 0.000492045175466641, 'samples': 2672064, 'steps': 13916, 'loss/train': 1.871131181716919}}}} +11/06/2021 23:10:12 - INFO - __main__ - Step 13921: {'lr': 0.0004920398624978493, 'samples': 2672832, 'steps': 13920, 'loss/train': 1.4717364311218262}} +11/06/2021 23:10:14 - INFO - __main__ - Step 13925: {'lr': 0.0004920345477841067, 'samples': 2673600, 'steps': 13924, 'loss/train': 2.0693888664245605}} +11/06/2021 23:10:16 - INFO - __main__ - Step 13929: {'lr': 0.0004920292313254516, 'samples': 2674368, 'steps': 13928, 'loss/train': 2.1696088314056396}} +11/06/2021 23:10:17 - INFO - __main__ - Step 13933: {'lr': 0.0004920239131219223, 'samples': 2675136, 'steps': 13932, 'loss/train': 0.7648064494132996}} +11/06/2021 23:10:19 - INFO - __main__ - Step 13937: {'lr': 0.0004920185931735572, 'samples': 2675904, 'steps': 13936, 'loss/train': 1.8334205150604248}} +11/06/2021 23:10:19 - INFO - __main__ - Step 13937: {'lr': 0.0004920185931735572, 'samples': 2675904, 'steps': 13936, 'loss/train': 1.8334205150604248}} +11/06/2021 23:10:24 - INFO - __main__ - Step 13946: {'lr': 0.0004920066169103783, 'samples': 2677632, 'steps': 13945, 'loss/train': 1.0051872730255127}} +11/06/2021 23:10:26 - INFO - __main__ - Step 13950: {'lr': 0.0004920012912915616, 'samples': 2678400, 'steps': 13949, 'loss/train': 1.9164284467697144}} +11/06/2021 23:10:27 - INFO - __main__ - Step 13954: {'lr': 0.0004919959639280722, 'samples': 2679168, 'steps': 13953, 'loss/train': 3.453373432159424}}} +11/06/2021 23:10:29 - INFO - __main__ - Step 13958: {'lr': 0.0004919906348199483, 'samples': 2679936, 'steps': 13957, 'loss/train': 1.8448896408081055}} +11/06/2021 23:10:32 - INFO - __main__ - Step 13963: {'lr': 0.00049198397098146, 'samples': 2680896, 'steps': 13962, 'loss/train': 2.475085496902466}55}} +11/06/2021 23:10:34 - INFO - __main__ - Step 13967: {'lr': 0.0004919786379480494, 'samples': 2681664, 'steps': 13966, 'loss/train': 2.0461950302124023}} +11/06/2021 23:10:34 - INFO - __main__ - Step 13967: {'lr': 0.0004919786379480494, 'samples': 2681664, 'steps': 13966, 'loss/train': 2.0461950302124023}} +11/06/2021 23:10:37 - INFO - __main__ - Step 13974: {'lr': 0.0004919693009418782, 'samples': 2683008, 'steps': 13973, 'loss/train': 2.224214553833008}}} +11/06/2021 23:10:40 - INFO - __main__ - Step 13979: {'lr': 0.0004919626283809149, 'samples': 2683968, 'steps': 13978, 'loss/train': 1.7867261171340942}} +11/06/2021 23:10:40 - INFO - __main__ - Step 13979: {'lr': 0.0004919626283809149, 'samples': 2683968, 'steps': 13978, 'loss/train': 1.7867261171340942}} +11/06/2021 23:10:44 - INFO - __main__ - Step 13987: {'lr': 0.0004919519466141242, 'samples': 2685504, 'steps': 13986, 'loss/train': 2.206554889678955}}} +11/06/2021 23:10:45 - INFO - __main__ - Step 13991: {'lr': 0.0004919466031142342, 'samples': 2686272, 'steps': 13990, 'loss/train': 1.2076705694198608}} +11/06/2021 23:10:48 - INFO - __main__ - Step 13995: {'lr': 0.0004919412578700654, 'samples': 2687040, 'steps': 13994, 'loss/train': 1.2231806516647339}} +11/06/2021 23:10:50 - INFO - __main__ - Step 14000: {'lr': 0.0004919345738620218, 'samples': 2688000, 'steps': 13999, 'loss/train': 1.2765216827392578}} +11/06/2021 23:10:52 - INFO - __main__ - Step 14004: {'lr': 0.0004919292246933675, 'samples': 2688768, 'steps': 14003, 'loss/train': 1.9574697017669678}} +11/06/2021 23:10:52 - INFO - __main__ - Step 14004: {'lr': 0.0004919292246933675, 'samples': 2688768, 'steps': 14003, 'loss/train': 1.9574697017669678}} +11/06/2021 23:10:55 - INFO - __main__ - Step 14011: {'lr': 0.0004919198594513771, 'samples': 2690112, 'steps': 14010, 'loss/train': 1.3401371240615845}} +11/06/2021 23:10:58 - INFO - __main__ - Step 14016: {'lr': 0.0004919131667226398, 'samples': 2691072, 'steps': 14015, 'loss/train': 1.5199148654937744}} +11/06/2021 23:11:00 - INFO - __main__ - Step 14021: {'lr': 0.0004919064712688439, 'samples': 2692032, 'steps': 14020, 'loss/train': 1.8053239583969116}} +11/06/2021 23:11:02 - INFO - __main__ - Step 14025: {'lr': 0.0004919011129438158, 'samples': 2692800, 'steps': 14024, 'loss/train': 1.4526000022888184}} +11/06/2021 23:11:04 - INFO - __main__ - Step 14029: {'lr': 0.0004918957528748371, 'samples': 2693568, 'steps': 14028, 'loss/train': 1.5124090909957886}} +11/06/2021 23:11:06 - INFO - __main__ - Step 14033: {'lr': 0.0004918903910619465, 'samples': 2694336, 'steps': 14032, 'loss/train': 1.157104253768921}}} +11/06/2021 23:11:08 - INFO - __main__ - Step 14037: {'lr': 0.0004918850275051829, 'samples': 2695104, 'steps': 14036, 'loss/train': 2.457850217819214}}} +11/06/2021 23:11:10 - INFO - __main__ - Step 14042: {'lr': 0.0004918783206069652, 'samples': 2696064, 'steps': 14041, 'loss/train': 1.7770543098449707}} +11/06/2021 23:11:12 - INFO - __main__ - Step 14046: {'lr': 0.000491872953126628, 'samples': 2696832, 'steps': 14045, 'loss/train': 1.677998661994934}7}} +11/06/2021 23:11:12 - INFO - __main__ - Step 14046: {'lr': 0.000491872953126628, 'samples': 2696832, 'steps': 14045, 'loss/train': 1.677998661994934}7}} +11/06/2021 23:11:15 - INFO - __main__ - Step 14053: {'lr': 0.0004918635558401687, 'samples': 2698176, 'steps': 14052, 'loss/train': 2.0729172229766846}} +11/06/2021 23:11:18 - INFO - __main__ - Step 14058: {'lr': 0.0004918568402232863, 'samples': 2699136, 'steps': 14057, 'loss/train': 1.5368565320968628}} +11/06/2021 23:11:18 - INFO - __main__ - Step 14058: {'lr': 0.0004918568402232863, 'samples': 2699136, 'steps': 14057, 'loss/train': 1.5368565320968628}} +11/06/2021 23:11:22 - INFO - __main__ - Step 14066: {'lr': 0.0004918460895695037, 'samples': 2700672, 'steps': 14065, 'loss/train': 1.585329294204712}}} +11/06/2021 23:11:24 - INFO - __main__ - Step 14070: {'lr': 0.0004918407116272622, 'samples': 2701440, 'steps': 14069, 'loss/train': 1.0781822204589844}} +11/06/2021 23:11:26 - INFO - __main__ - Step 14075: {'lr': 0.0004918339867476469, 'samples': 2702400, 'steps': 14074, 'loss/train': 1.5994923114776611}} +11/06/2021 23:11:26 - INFO - __main__ - Step 14075: {'lr': 0.0004918339867476469, 'samples': 2702400, 'steps': 14074, 'loss/train': 1.5994923114776611}} +11/06/2021 23:11:26 - INFO - __main__ - Step 14075: {'lr': 0.0004918339867476469, 'samples': 2702400, 'steps': 14074, 'loss/train': 1.5994923114776611}} +11/06/2021 23:11:32 - INFO - __main__ - Step 14086: {'lr': 0.0004918191824235335, 'samples': 2704512, 'steps': 14085, 'loss/train': 1.54026198387146}1}} +11/06/2021 23:11:34 - INFO - __main__ - Step 14091: {'lr': 0.000491812448826852, 'samples': 2705472, 'steps': 14090, 'loss/train': 1.8842805624008179}}} +11/06/2021 23:11:36 - INFO - __main__ - Step 14095: {'lr': 0.0004918070599882778, 'samples': 2706240, 'steps': 14094, 'loss/train': 1.7472896575927734}} +11/06/2021 23:11:38 - INFO - __main__ - Step 14099: {'lr': 0.0004918016694064313, 'samples': 2707008, 'steps': 14098, 'loss/train': 1.9474259614944458}} +11/06/2021 23:11:40 - INFO - __main__ - Step 14103: {'lr': 0.000491796277081351, 'samples': 2707776, 'steps': 14102, 'loss/train': 1.817934274673462}8}} +11/06/2021 23:11:42 - INFO - __main__ - Step 14107: {'lr': 0.000491790883013076, 'samples': 2708544, 'steps': 14106, 'loss/train': 1.3012551069259644}}} +11/06/2021 23:11:44 - INFO - __main__ - Step 14111: {'lr': 0.0004917854872016451, 'samples': 2709312, 'steps': 14110, 'loss/train': 1.7014143466949463}} +11/06/2021 23:11:46 - INFO - __main__ - Step 14115: {'lr': 0.0004917800896470974, 'samples': 2710080, 'steps': 14114, 'loss/train': 1.9659100770950317}} +11/06/2021 23:11:47 - INFO - __main__ - Step 14119: {'lr': 0.0004917746903494717, 'samples': 2710848, 'steps': 14118, 'loss/train': 0.9476760029792786}} +11/06/2021 23:11:49 - INFO - __main__ - Step 14123: {'lr': 0.0004917692893088067, 'samples': 2711616, 'steps': 14122, 'loss/train': 1.9275217056274414}} +11/06/2021 23:11:49 - INFO - __main__ - Step 14123: {'lr': 0.0004917692893088067, 'samples': 2711616, 'steps': 14122, 'loss/train': 1.9275217056274414}} +11/06/2021 23:11:54 - INFO - __main__ - Step 14131: {'lr': 0.0004917584819985153, 'samples': 2713152, 'steps': 14130, 'loss/train': 1.5905683040618896}} +11/06/2021 23:11:54 - INFO - __main__ - Step 14131: {'lr': 0.0004917584819985153, 'samples': 2713152, 'steps': 14130, 'loss/train': 1.5905683040618896}} +11/06/2021 23:11:57 - INFO - __main__ - Step 14138: {'lr': 0.000491749019883036, 'samples': 2714496, 'steps': 14137, 'loss/train': 1.6772507429122925}}} +11/06/2021 23:11:57 - INFO - __main__ - Step 14138: {'lr': 0.000491749019883036, 'samples': 2714496, 'steps': 14137, 'loss/train': 1.6772507429122925}}} +11/06/2021 23:12:02 - INFO - __main__ - Step 14147: {'lr': 0.0004917368464631772, 'samples': 2716224, 'steps': 14146, 'loss/train': 1.4266034364700317}} +11/06/2021 23:12:04 - INFO - __main__ - Step 14151: {'lr': 0.0004917314332223295, 'samples': 2716992, 'steps': 14150, 'loss/train': 1.8678841590881348}} +11/06/2021 23:12:05 - INFO - __main__ - Step 14155: {'lr': 0.0004917260182387545, 'samples': 2717760, 'steps': 14154, 'loss/train': 1.4603012800216675}} +11/06/2021 23:12:08 - INFO - __main__ - Step 14159: {'lr': 0.0004917206015124913, 'samples': 2718528, 'steps': 14158, 'loss/train': 0.9594613313674927}} +11/06/2021 23:12:10 - INFO - __main__ - Step 14164: {'lr': 0.0004917138281540664, 'samples': 2719488, 'steps': 14163, 'loss/train': 2.4625284671783447}} +11/06/2021 23:12:10 - INFO - __main__ - Step 14164: {'lr': 0.0004917138281540664, 'samples': 2719488, 'steps': 14163, 'loss/train': 2.4625284671783447}} +11/06/2021 23:12:13 - INFO - __main__ - Step 14171: {'lr': 0.0004917043408779629, 'samples': 2720832, 'steps': 14170, 'loss/train': 1.746435523033142}}} +11/06/2021 23:12:15 - INFO - __main__ - Step 14175: {'lr': 0.0004916989171813374, 'samples': 2721600, 'steps': 14174, 'loss/train': 1.6893455982208252}} +11/06/2021 23:12:18 - INFO - __main__ - Step 14180: {'lr': 0.0004916921351101796, 'samples': 2722560, 'steps': 14179, 'loss/train': 1.529984951019287}}} +11/06/2021 23:12:18 - INFO - __main__ - Step 14180: {'lr': 0.0004916921351101796, 'samples': 2722560, 'steps': 14179, 'loss/train': 1.529984951019287}}} +11/06/2021 23:12:22 - INFO - __main__ - Step 14188: {'lr': 0.0004916812781334161, 'samples': 2724096, 'steps': 14187, 'loss/train': 1.5331050157546997}} +11/06/2021 23:12:23 - INFO - __main__ - Step 14192: {'lr': 0.0004916758470314662, 'samples': 2724864, 'steps': 14191, 'loss/train': 1.8545008897781372}} +11/06/2021 23:12:25 - INFO - __main__ - Step 14196: {'lr': 0.0004916704141871899, 'samples': 2725632, 'steps': 14195, 'loss/train': 1.6380163431167603}} +11/06/2021 23:12:28 - INFO - __main__ - Step 14201: {'lr': 0.0004916636206817575, 'samples': 2726592, 'steps': 14200, 'loss/train': 1.805939793586731}}} +11/06/2021 23:12:28 - INFO - __main__ - Step 14201: {'lr': 0.0004916636206817575, 'samples': 2726592, 'steps': 14200, 'loss/train': 1.805939793586731}}} +11/06/2021 23:12:31 - INFO - __main__ - Step 14208: {'lr': 0.0004916541052007936, 'samples': 2727936, 'steps': 14207, 'loss/train': 1.0482618808746338}} +11/06/2021 23:12:33 - INFO - __main__ - Step 14212: {'lr': 0.0004916486653876029, 'samples': 2728704, 'steps': 14211, 'loss/train': 1.552703619003296}}} +11/06/2021 23:12:36 - INFO - __main__ - Step 14217: {'lr': 0.0004916418631712481, 'samples': 2729664, 'steps': 14216, 'loss/train': 1.3125375509262085}} +11/06/2021 23:12:38 - INFO - __main__ - Step 14221: {'lr': 0.000491636419438319, 'samples': 2730432, 'steps': 14220, 'loss/train': 1.322358250617981}5}} +11/06/2021 23:12:40 - INFO - __main__ - Step 14225: {'lr': 0.0004916309739633475, 'samples': 2731200, 'steps': 14224, 'loss/train': 1.5547466278076172}} +11/06/2021 23:12:40 - INFO - __main__ - Step 14225: {'lr': 0.0004916309739633475, 'samples': 2731200, 'steps': 14224, 'loss/train': 1.5547466278076172}} +11/06/2021 23:12:43 - INFO - __main__ - Step 14232: {'lr': 0.0004916214401904763, 'samples': 2732544, 'steps': 14231, 'loss/train': 1.461196780204773}}} +11/06/2021 23:12:46 - INFO - __main__ - Step 14237: {'lr': 0.0004916146270865721, 'samples': 2733504, 'steps': 14236, 'loss/train': 2.5321567058563232}} +11/06/2021 23:12:46 - INFO - __main__ - Step 14237: {'lr': 0.0004916146270865721, 'samples': 2733504, 'steps': 14236, 'loss/train': 2.5321567058563232}} +11/06/2021 23:12:49 - INFO - __main__ - Step 14244: {'lr': 0.0004916050841686748, 'samples': 2734848, 'steps': 14243, 'loss/train': 1.6944113969802856}} +11/06/2021 23:12:52 - INFO - __main__ - Step 14249: {'lr': 0.0004915982645328304, 'samples': 2735808, 'steps': 14248, 'loss/train': 1.6930842399597168}} +11/06/2021 23:12:52 - INFO - __main__ - Step 14249: {'lr': 0.0004915982645328304, 'samples': 2735808, 'steps': 14248, 'loss/train': 1.6930842399597168}} +11/06/2021 23:12:57 - INFO - __main__ - Step 14258: {'lr': 0.0004915859823301535, 'samples': 2737536, 'steps': 14257, 'loss/train': 1.91822350025177}8}} +11/06/2021 23:12:58 - INFO - __main__ - Step 14262: {'lr': 0.0004915805207431537, 'samples': 2738304, 'steps': 14261, 'loss/train': 1.4041943550109863}} +11/06/2021 23:13:00 - INFO - __main__ - Step 14266: {'lr': 0.0004915750574145148, 'samples': 2739072, 'steps': 14265, 'loss/train': 1.9792180061340332}} +11/06/2021 23:13:03 - INFO - __main__ - Step 14271: {'lr': 0.0004915682258045958, 'samples': 2740032, 'steps': 14270, 'loss/train': 1.8175733089447021}} +11/06/2021 23:13:05 - INFO - __main__ - Step 14275: {'lr': 0.0004915627585574124, 'samples': 2740800, 'steps': 14274, 'loss/train': 1.643608570098877}}} +11/06/2021 23:13:07 - INFO - __main__ - Step 14279: {'lr': 0.0004915572895687179, 'samples': 2741568, 'steps': 14278, 'loss/train': 1.9221125841140747}} +11/06/2021 23:13:09 - INFO - __main__ - Step 14283: {'lr': 0.0004915518188385514, 'samples': 2742336, 'steps': 14282, 'loss/train': 1.557709813117981}}} +11/06/2021 23:13:10 - INFO - __main__ - Step 14287: {'lr': 0.0004915463463669527, 'samples': 2743104, 'steps': 14286, 'loss/train': 2.307543992996216}}} +11/06/2021 23:13:13 - INFO - __main__ - Step 14292: {'lr': 0.0004915395033286251, 'samples': 2744064, 'steps': 14291, 'loss/train': 1.8184715509414673}} +11/06/2021 23:13:15 - INFO - __main__ - Step 14296: {'lr': 0.000491534026938948, 'samples': 2744832, 'steps': 14295, 'loss/train': 1.8665683269500732}}} +11/06/2021 23:13:17 - INFO - __main__ - Step 14300: {'lr': 0.0004915285488079666, 'samples': 2745600, 'steps': 14299, 'loss/train': 1.6357394456863403}} +11/06/2021 23:13:19 - INFO - __main__ - Step 14304: {'lr': 0.0004915230689357206, 'samples': 2746368, 'steps': 14303, 'loss/train': 1.9127839803695679}} +11/06/2021 23:13:20 - INFO - __main__ - Step 14308: {'lr': 0.0004915175873222497, 'samples': 2747136, 'steps': 14307, 'loss/train': 1.7802067995071411}} +11/06/2021 23:13:20 - INFO - __main__ - Step 14308: {'lr': 0.0004915175873222497, 'samples': 2747136, 'steps': 14307, 'loss/train': 1.7802067995071411}} +11/06/2021 23:13:24 - INFO - __main__ - Step 14316: {'lr': 0.0004915066188717905, 'samples': 2748672, 'steps': 14315, 'loss/train': 1.671004056930542}}} +11/06/2021 23:13:24 - INFO - __main__ - Step 14316: {'lr': 0.0004915066188717905, 'samples': 2748672, 'steps': 14315, 'loss/train': 1.671004056930542}}} +11/06/2021 23:13:28 - INFO - __main__ - Step 14323: {'lr': 0.0004914970157646222, 'samples': 2750016, 'steps': 14322, 'loss/train': 1.5857484340667725}} +11/06/2021 23:13:30 - INFO - __main__ - Step 14328: {'lr': 0.0004914901531379019, 'samples': 2750976, 'steps': 14327, 'loss/train': 1.843706727027893}}} +11/06/2021 23:13:30 - INFO - __main__ - Step 14328: {'lr': 0.0004914901531379019, 'samples': 2750976, 'steps': 14327, 'loss/train': 1.843706727027893}}} +11/06/2021 23:13:34 - INFO - __main__ - Step 14336: {'lr': 0.0004914791672769713, 'samples': 2752512, 'steps': 14335, 'loss/train': 1.6169592142105103}} +11/06/2021 23:13:36 - INFO - __main__ - Step 14340: {'lr': 0.0004914736717351233, 'samples': 2753280, 'steps': 14339, 'loss/train': 0.8791477084159851}} +11/06/2021 23:13:38 - INFO - __main__ - Step 14344: {'lr': 0.0004914681744524064, 'samples': 2754048, 'steps': 14343, 'loss/train': 1.9771595001220703}} +11/06/2021 23:13:40 - INFO - __main__ - Step 14349: {'lr': 0.0004914613004009736, 'samples': 2755008, 'steps': 14348, 'loss/train': 1.3072386980056763}} +11/06/2021 23:13:40 - INFO - __main__ - Step 14349: {'lr': 0.0004914613004009736, 'samples': 2755008, 'steps': 14348, 'loss/train': 1.3072386980056763}} +11/06/2021 23:13:44 - INFO - __main__ - Step 14356: {'lr': 0.0004914516721594382, 'samples': 2756352, 'steps': 14355, 'loss/train': 1.8118442296981812}} +11/06/2021 23:13:46 - INFO - __main__ - Step 14360: {'lr': 0.0004914461679136419, 'samples': 2757120, 'steps': 14359, 'loss/train': 1.5644958019256592}} +11/06/2021 23:13:48 - INFO - __main__ - Step 14365: {'lr': 0.0004914392851585829, 'samples': 2758080, 'steps': 14364, 'loss/train': 1.7351176738739014}} +11/06/2021 23:13:51 - INFO - __main__ - Step 14370: {'lr': 0.0004914323996838036, 'samples': 2759040, 'steps': 14369, 'loss/train': 1.368338942527771}}} +11/06/2021 23:13:53 - INFO - __main__ - Step 14374: {'lr': 0.0004914268893458336, 'samples': 2759808, 'steps': 14373, 'loss/train': 1.7623484134674072}} +11/06/2021 23:13:53 - INFO - __main__ - Step 14374: {'lr': 0.0004914268893458336, 'samples': 2759808, 'steps': 14373, 'loss/train': 1.7623484134674072}} +11/06/2021 23:13:57 - INFO - __main__ - Step 14381: {'lr': 0.0004914172420662556, 'samples': 2761152, 'steps': 14380, 'loss/train': 1.8425896167755127}} +11/06/2021 23:13:59 - INFO - __main__ - Step 14385: {'lr': 0.000491411726941919, 'samples': 2761920, 'steps': 14384, 'loss/train': 1.7564046382904053}}} +11/06/2021 23:14:00 - INFO - __main__ - Step 14389: {'lr': 0.00049140621007716, 'samples': 2762688, 'steps': 14388, 'loss/train': 1.5696700811386108}}}} +11/06/2021 23:14:02 - INFO - __main__ - Step 14393: {'lr': 0.0004914006914720184, 'samples': 2763456, 'steps': 14392, 'loss/train': 1.1342967748641968}} +11/06/2021 23:14:05 - INFO - __main__ - Step 14398: {'lr': 0.0004913937907682391, 'samples': 2764416, 'steps': 14397, 'loss/train': 1.6365022659301758}} +11/06/2021 23:14:07 - INFO - __main__ - Step 14402: {'lr': 0.0004913882682473821, 'samples': 2765184, 'steps': 14401, 'loss/train': 1.6088601350784302}} +11/06/2021 23:14:09 - INFO - __main__ - Step 14406: {'lr': 0.000491382743986272, 'samples': 2765952, 'steps': 14405, 'loss/train': 2.084760904312134}2}} +11/06/2021 23:14:10 - INFO - __main__ - Step 14410: {'lr': 0.0004913772179849483, 'samples': 2766720, 'steps': 14409, 'loss/train': 1.7048285007476807}} +11/06/2021 23:14:12 - INFO - __main__ - Step 14414: {'lr': 0.000491371690243451, 'samples': 2767488, 'steps': 14413, 'loss/train': 1.3805193901062012}}} +11/06/2021 23:14:15 - INFO - __main__ - Step 14419: {'lr': 0.0004913647781195212, 'samples': 2768448, 'steps': 14418, 'loss/train': 1.5809930562973022}} +11/06/2021 23:14:15 - INFO - __main__ - Step 14419: {'lr': 0.0004913647781195212, 'samples': 2768448, 'steps': 14418, 'loss/train': 1.5809930562973022}} +11/06/2021 23:14:18 - INFO - __main__ - Step 14426: {'lr': 0.0004913550965783165, 'samples': 2769792, 'steps': 14425, 'loss/train': 1.8378410339355469}} +11/06/2021 23:14:20 - INFO - __main__ - Step 14430: {'lr': 0.0004913495618765235, 'samples': 2770560, 'steps': 14429, 'loss/train': 1.6800792217254639}} +11/06/2021 23:14:23 - INFO - __main__ - Step 14435: {'lr': 0.0004913426410524482, 'samples': 2771520, 'steps': 14434, 'loss/train': 0.5304341316223145}} +11/06/2021 23:14:25 - INFO - __main__ - Step 14439: {'lr': 0.0004913371024357694, 'samples': 2772288, 'steps': 14438, 'loss/train': 1.7349668741226196}} +11/06/2021 23:14:27 - INFO - __main__ - Step 14443: {'lr': 0.0004913315620792061, 'samples': 2773056, 'steps': 14442, 'loss/train': 1.784220576286316}}} +11/06/2021 23:14:28 - INFO - __main__ - Step 14447: {'lr': 0.0004913260199827986, 'samples': 2773824, 'steps': 14446, 'loss/train': 2.1198136806488037}} +11/06/2021 23:14:31 - INFO - __main__ - Step 14452: {'lr': 0.0004913190899156936, 'samples': 2774784, 'steps': 14451, 'loss/train': 1.592616081237793}}} +11/06/2021 23:14:33 - INFO - __main__ - Step 14456: {'lr': 0.0004913135439047821, 'samples': 2775552, 'steps': 14455, 'loss/train': 1.7716397047042847}} +11/06/2021 23:14:35 - INFO - __main__ - Step 14460: {'lr': 0.000491307996154156, 'samples': 2776320, 'steps': 14459, 'loss/train': 1.87995445728302}47}} +11/06/2021 23:14:37 - INFO - __main__ - Step 14464: {'lr': 0.0004913024466638553, 'samples': 2777088, 'steps': 14463, 'loss/train': 1.7339403629302979}} +11/06/2021 23:14:38 - INFO - __main__ - Step 14468: {'lr': 0.0004912968954339202, 'samples': 2777856, 'steps': 14467, 'loss/train': 1.555679202079773}}} +11/06/2021 23:14:40 - INFO - __main__ - Step 14472: {'lr': 0.0004912913424643904, 'samples': 2778624, 'steps': 14471, 'loss/train': 1.8691980838775635}} +11/06/2021 23:14:40 - INFO - __main__ - Step 14472: {'lr': 0.0004912913424643904, 'samples': 2778624, 'steps': 14471, 'loss/train': 1.8691980838775635}} +11/06/2021 23:14:45 - INFO - __main__ - Step 14480: {'lr': 0.0004912802313067076, 'samples': 2780160, 'steps': 14479, 'loss/train': 1.160788893699646}}} +11/06/2021 23:14:46 - INFO - __main__ - Step 14484: {'lr': 0.0004912746731186346, 'samples': 2780928, 'steps': 14483, 'loss/train': 1.4715304374694824}} +11/06/2021 23:14:49 - INFO - __main__ - Step 14488: {'lr': 0.0004912691131911272, 'samples': 2781696, 'steps': 14487, 'loss/train': 1.073344111442566}}} +11/06/2021 23:14:49 - INFO - __main__ - Step 14488: {'lr': 0.0004912691131911272, 'samples': 2781696, 'steps': 14487, 'loss/train': 1.073344111442566}}} +11/06/2021 23:14:52 - INFO - __main__ - Step 14495: {'lr': 0.0004912593791325962, 'samples': 2783040, 'steps': 14494, 'loss/train': 0.6017135977745056}} +11/06/2021 23:14:54 - INFO - __main__ - Step 14500: {'lr': 0.0004912524229724002, 'samples': 2784000, 'steps': 14499, 'loss/train': 1.174378752708435}}} +11/06/2021 23:14:57 - INFO - __main__ - Step 14505: {'lr': 0.0004912454640945889, 'samples': 2784960, 'steps': 14504, 'loss/train': 1.8055917024612427}} +11/06/2021 23:14:59 - INFO - __main__ - Step 14509: {'lr': 0.0004912398950357094, 'samples': 2785728, 'steps': 14508, 'loss/train': 2.2110788822174072}} +11/06/2021 23:14:59 - INFO - __main__ - Step 14509: {'lr': 0.0004912398950357094, 'samples': 2785728, 'steps': 14508, 'loss/train': 2.2110788822174072}} +11/06/2021 23:15:02 - INFO - __main__ - Step 14516: {'lr': 0.0004912301449977837, 'samples': 2787072, 'steps': 14515, 'loss/train': 1.7214689254760742}} +11/06/2021 23:15:05 - INFO - __main__ - Step 14521: {'lr': 0.0004912231774241298, 'samples': 2788032, 'steps': 14520, 'loss/train': 1.797451138496399}}} +11/06/2021 23:15:07 - INFO - __main__ - Step 14526: {'lr': 0.0004912162071331898, 'samples': 2788992, 'steps': 14525, 'loss/train': 1.6764172315597534}} +11/06/2021 23:15:09 - INFO - __main__ - Step 14530: {'lr': 0.0004912106289440446, 'samples': 2789760, 'steps': 14529, 'loss/train': 1.904273271560669}}} +11/06/2021 23:15:11 - INFO - __main__ - Step 14534: {'lr': 0.0004912050490159268, 'samples': 2790528, 'steps': 14533, 'loss/train': 1.7847373485565186}} +11/06/2021 23:15:12 - INFO - __main__ - Step 14538: {'lr': 0.0004911994673488766, 'samples': 2791296, 'steps': 14537, 'loss/train': 1.377058982849121}}} +11/06/2021 23:15:15 - INFO - __main__ - Step 14542: {'lr': 0.0004911938839429344, 'samples': 2792064, 'steps': 14541, 'loss/train': 1.8177210092544556}} +11/06/2021 23:15:17 - INFO - __main__ - Step 14547: {'lr': 0.0004911869022402508, 'samples': 2793024, 'steps': 14546, 'loss/train': 1.8774888515472412}} +11/06/2021 23:15:19 - INFO - __main__ - Step 14551: {'lr': 0.0004911813149219485, 'samples': 2793792, 'steps': 14550, 'loss/train': 1.7999236583709717}} +11/06/2021 23:15:19 - INFO - __main__ - Step 14551: {'lr': 0.0004911813149219485, 'samples': 2793792, 'steps': 14550, 'loss/train': 1.7999236583709717}} +11/06/2021 23:15:22 - INFO - __main__ - Step 14557: {'lr': 0.0004911729306843302, 'samples': 2794944, 'steps': 14556, 'loss/train': 1.9681403636932373}} +11/06/2021 23:15:25 - INFO - __main__ - Step 14563: {'lr': 0.000491164542534635, 'samples': 2796096, 'steps': 14562, 'loss/train': 1.9331468343734741}}} +11/06/2021 23:15:27 - INFO - __main__ - Step 14567: {'lr': 0.0004911589482615294, 'samples': 2796864, 'steps': 14566, 'loss/train': 0.8703035116195679}} +11/06/2021 23:15:29 - INFO - __main__ - Step 14571: {'lr': 0.0004911533522498239, 'samples': 2797632, 'steps': 14570, 'loss/train': 1.7870599031448364}} +11/06/2021 23:15:30 - INFO - __main__ - Step 14575: {'lr': 0.0004911477544995585, 'samples': 2798400, 'steps': 14574, 'loss/train': 1.705611228942871}}} +11/06/2021 23:15:32 - INFO - __main__ - Step 14579: {'lr': 0.0004911421550107739, 'samples': 2799168, 'steps': 14578, 'loss/train': 1.5826555490493774}} +11/06/2021 23:15:35 - INFO - __main__ - Step 14584: {'lr': 0.000491135153205062, 'samples': 2800128, 'steps': 14583, 'loss/train': 1.6225132942199707}}} +11/06/2021 23:15:37 - INFO - __main__ - Step 14588: {'lr': 0.0004911295498047565, 'samples': 2800896, 'steps': 14587, 'loss/train': 2.0302164554595947}} +11/06/2021 23:15:39 - INFO - __main__ - Step 14592: {'lr': 0.000491123944666063, 'samples': 2801664, 'steps': 14591, 'loss/train': 1.9390480518341064}}} +11/06/2021 23:15:41 - INFO - __main__ - Step 14596: {'lr': 0.0004911183377890218, 'samples': 2802432, 'steps': 14595, 'loss/train': 1.3001048564910889}} +11/06/2021 23:15:43 - INFO - __main__ - Step 14600: {'lr': 0.0004911127291736735, 'samples': 2803200, 'steps': 14599, 'loss/train': 1.4260157346725464}} +11/06/2021 23:15:45 - INFO - __main__ - Step 14605: {'lr': 0.0004911057159600551, 'samples': 2804160, 'steps': 14604, 'loss/train': 1.5187530517578125}} +11/06/2021 23:15:47 - INFO - __main__ - Step 14609: {'lr': 0.0004911001034336633, 'samples': 2804928, 'steps': 14608, 'loss/train': 1.6968247890472412}} +11/06/2021 23:15:49 - INFO - __main__ - Step 14613: {'lr': 0.0004910944891690956, 'samples': 2805696, 'steps': 14612, 'loss/train': 1.5665946006774902}} +11/06/2021 23:15:51 - INFO - __main__ - Step 14617: {'lr': 0.0004910888731663928, 'samples': 2806464, 'steps': 14616, 'loss/train': 1.519328236579895}}} +11/06/2021 23:15:53 - INFO - __main__ - Step 14621: {'lr': 0.0004910832554255951, 'samples': 2807232, 'steps': 14620, 'loss/train': 1.7540532350540161}} +11/06/2021 23:15:53 - INFO - __main__ - Step 14621: {'lr': 0.0004910832554255951, 'samples': 2807232, 'steps': 14620, 'loss/train': 1.7540532350540161}} +11/06/2021 23:15:57 - INFO - __main__ - Step 14629: {'lr': 0.0004910720147298772, 'samples': 2808768, 'steps': 14628, 'loss/train': 1.5132771730422974}} +11/06/2021 23:15:59 - INFO - __main__ - Step 14633: {'lr': 0.0004910663917750382, 'samples': 2809536, 'steps': 14632, 'loss/train': 1.8392850160598755}} +11/06/2021 23:16:01 - INFO - __main__ - Step 14638: {'lr': 0.0004910593606375261, 'samples': 2810496, 'steps': 14637, 'loss/train': 2.147937297821045}}} +11/06/2021 23:16:03 - INFO - __main__ - Step 14642: {'lr': 0.0004910537337723954, 'samples': 2811264, 'steps': 14641, 'loss/train': 1.8136534690856934}} +11/06/2021 23:16:05 - INFO - __main__ - Step 14646: {'lr': 0.0004910481051694231, 'samples': 2812032, 'steps': 14645, 'loss/train': 1.9416497945785522}} +11/06/2021 23:16:05 - INFO - __main__ - Step 14646: {'lr': 0.0004910481051694231, 'samples': 2812032, 'steps': 14645, 'loss/train': 1.9416497945785522}} +11/06/2021 23:16:09 - INFO - __main__ - Step 14653: {'lr': 0.0004910382509326627, 'samples': 2813376, 'steps': 14652, 'loss/train': 2.0839693546295166}} +11/06/2021 23:16:11 - INFO - __main__ - Step 14658: {'lr': 0.0004910312089338634, 'samples': 2814336, 'steps': 14657, 'loss/train': 1.369263768196106}}} +11/06/2021 23:16:13 - INFO - __main__ - Step 14663: {'lr': 0.0004910241642199406, 'samples': 2815296, 'steps': 14662, 'loss/train': 1.4840021133422852}} +11/06/2021 23:16:16 - INFO - __main__ - Step 14667: {'lr': 0.0004910185264939667, 'samples': 2816064, 'steps': 14666, 'loss/train': 1.7304264307022095}} +11/06/2021 23:16:16 - INFO - __main__ - Step 14667: {'lr': 0.0004910185264939667, 'samples': 2816064, 'steps': 14666, 'loss/train': 1.7304264307022095}} +11/06/2021 23:16:19 - INFO - __main__ - Step 14674: {'lr': 0.0004910086562924663, 'samples': 2817408, 'steps': 14673, 'loss/train': 1.5062963962554932}} +11/06/2021 23:16:21 - INFO - __main__ - Step 14679: {'lr': 0.0004910016028906813, 'samples': 2818368, 'steps': 14678, 'loss/train': 2.185955047607422}}} +11/06/2021 23:16:21 - INFO - __main__ - Step 14679: {'lr': 0.0004910016028906813, 'samples': 2818368, 'steps': 14678, 'loss/train': 2.185955047607422}}} +11/06/2021 23:16:21 - INFO - __main__ - Step 14679: {'lr': 0.0004910016028906813, 'samples': 2818368, 'steps': 14678, 'loss/train': 2.185955047607422}}} +11/06/2021 23:16:26 - INFO - __main__ - Step 14690: {'lr': 0.0004909860758508052, 'samples': 2820480, 'steps': 14689, 'loss/train': 1.798073172569275}}} +11/06/2021 23:16:29 - INFO - __main__ - Step 14695: {'lr': 0.0004909790137619719, 'samples': 2821440, 'steps': 14694, 'loss/train': 1.473230242729187}}} +11/06/2021 23:16:31 - INFO - __main__ - Step 14700: {'lr': 0.0004909719489586029, 'samples': 2822400, 'steps': 14699, 'loss/train': 1.9752013683319092}} +11/06/2021 23:16:31 - INFO - __main__ - Step 14700: {'lr': 0.0004909719489586029, 'samples': 2822400, 'steps': 14699, 'loss/train': 1.9752013683319092}} +11/06/2021 23:16:31 - INFO - __main__ - Step 14700: {'lr': 0.0004909719489586029, 'samples': 2822400, 'steps': 14699, 'loss/train': 1.9752013683319092}} +11/06/2021 23:16:37 - INFO - __main__ - Step 14711: {'lr': 0.0004909563968364179, 'samples': 2824512, 'steps': 14710, 'loss/train': 1.516960859298706}}} +11/06/2021 23:16:40 - INFO - __main__ - Step 14717: {'lr': 0.0004909479083234936, 'samples': 2825664, 'steps': 14716, 'loss/train': 1.4705344438552856}} +11/06/2021 23:16:40 - INFO - __main__ - Step 14717: {'lr': 0.0004909479083234936, 'samples': 2825664, 'steps': 14716, 'loss/train': 1.4705344438552856}} +11/06/2021 23:16:42 - INFO - __main__ - Step 14723: {'lr': 0.0004909394159021425, 'samples': 2826816, 'steps': 14722, 'loss/train': 1.6616466045379639}} +11/06/2021 23:16:44 - INFO - __main__ - Step 14727: {'lr': 0.0004909337521166282, 'samples': 2827584, 'steps': 14726, 'loss/train': 1.4586058855056763}} +11/06/2021 23:16:47 - INFO - __main__ - Step 14733: {'lr': 0.0004909252531815388, 'samples': 2828736, 'steps': 14732, 'loss/train': 1.6438379287719727}} +11/06/2021 23:16:47 - INFO - __main__ - Step 14733: {'lr': 0.0004909252531815388, 'samples': 2828736, 'steps': 14732, 'loss/train': 1.6438379287719727}} +11/06/2021 23:16:51 - INFO - __main__ - Step 14740: {'lr': 0.0004909153328179248, 'samples': 2830080, 'steps': 14739, 'loss/train': 1.9582070112228394}} +11/06/2021 23:16:53 - INFO - __main__ - Step 14744: {'lr': 0.0004909096616505426, 'samples': 2830848, 'steps': 14743, 'loss/train': 1.605130672454834}}} +11/06/2021 23:16:55 - INFO - __main__ - Step 14749: {'lr': 0.0004909025702489407, 'samples': 2831808, 'steps': 14748, 'loss/train': 0.686924934387207}}} +11/06/2021 23:16:57 - INFO - __main__ - Step 14753: {'lr': 0.0004908968951738098, 'samples': 2832576, 'steps': 14752, 'loss/train': 2.133230209350586}}} +11/06/2021 23:16:57 - INFO - __main__ - Step 14753: {'lr': 0.0004908968951738098, 'samples': 2832576, 'steps': 14752, 'loss/train': 2.133230209350586}}} +11/06/2021 23:17:01 - INFO - __main__ - Step 14760: {'lr': 0.0004908869596133948, 'samples': 2833920, 'steps': 14759, 'loss/train': 2.303706407546997}}} +11/06/2021 23:17:03 - INFO - __main__ - Step 14765: {'lr': 0.0004908798595283159, 'samples': 2834880, 'steps': 14764, 'loss/train': 2.077310562133789}}} +11/06/2021 23:17:03 - INFO - __main__ - Step 14765: {'lr': 0.0004908798595283159, 'samples': 2834880, 'steps': 14764, 'loss/train': 2.077310562133789}}} +11/06/2021 23:17:07 - INFO - __main__ - Step 14773: {'lr': 0.0004908684937483119, 'samples': 2836416, 'steps': 14772, 'loss/train': 1.799191951751709}}} +11/06/2021 23:17:09 - INFO - __main__ - Step 14777: {'lr': 0.0004908628082535303, 'samples': 2837184, 'steps': 14776, 'loss/train': 1.8874455690383911}} +11/06/2021 23:17:11 - INFO - __main__ - Step 14781: {'lr': 0.0004908571210222837, 'samples': 2837952, 'steps': 14780, 'loss/train': 1.470587968826294}}} +11/06/2021 23:17:11 - INFO - __main__ - Step 14781: {'lr': 0.0004908571210222837, 'samples': 2837952, 'steps': 14780, 'loss/train': 1.470587968826294}}} +11/06/2021 23:17:15 - INFO - __main__ - Step 14789: {'lr': 0.0004908457413505596, 'samples': 2839488, 'steps': 14788, 'loss/train': 1.7249447107315063}} +11/06/2021 23:17:17 - INFO - __main__ - Step 14793: {'lr': 0.000490840048910164, 'samples': 2840256, 'steps': 14792, 'loss/train': 1.8218657970428467}}} +11/06/2021 23:17:19 - INFO - __main__ - Step 14797: {'lr': 0.0004908343547334674, 'samples': 2841024, 'steps': 14796, 'loss/train': 1.586082100868225}}} +11/06/2021 23:17:21 - INFO - __main__ - Step 14802: {'lr': 0.0004908272345709861, 'samples': 2841984, 'steps': 14801, 'loss/train': 1.824029564857483}}} +11/06/2021 23:17:21 - INFO - __main__ - Step 14802: {'lr': 0.0004908272345709861, 'samples': 2841984, 'steps': 14801, 'loss/train': 1.824029564857483}}} +11/06/2021 23:17:25 - INFO - __main__ - Step 14810: {'lr': 0.0004908158366683714, 'samples': 2843520, 'steps': 14809, 'loss/train': 2.220637798309326}}} +11/06/2021 23:17:27 - INFO - __main__ - Step 14814: {'lr': 0.000490810135112854, 'samples': 2844288, 'steps': 14813, 'loss/train': 1.816659688949585}}}} +11/06/2021 23:17:29 - INFO - __main__ - Step 14818: {'lr': 0.0004908044318212512, 'samples': 2845056, 'steps': 14817, 'loss/train': 1.5969890356063843}} +11/06/2021 23:17:31 - INFO - __main__ - Step 14823: {'lr': 0.0004907973002654404, 'samples': 2846016, 'steps': 14822, 'loss/train': 1.708099603652954}}} +11/06/2021 23:17:33 - INFO - __main__ - Step 14827: {'lr': 0.0004907915930677961, 'samples': 2846784, 'steps': 14826, 'loss/train': 1.3716732263565063}} +11/06/2021 23:17:33 - INFO - __main__ - Step 14827: {'lr': 0.0004907915930677961, 'samples': 2846784, 'steps': 14826, 'loss/train': 1.3716732263565063}} +11/06/2021 23:17:37 - INFO - __main__ - Step 14834: {'lr': 0.0004907816012948098, 'samples': 2848128, 'steps': 14833, 'loss/train': 2.050675630569458}}} +11/06/2021 23:17:39 - INFO - __main__ - Step 14839: {'lr': 0.0004907744610593181, 'samples': 2849088, 'steps': 14838, 'loss/train': 1.936640739440918}}} +11/06/2021 23:17:41 - INFO - __main__ - Step 14844: {'lr': 0.000490767318111595, 'samples': 2850048, 'steps': 14843, 'loss/train': 1.6642917394638062}}} +11/06/2021 23:17:43 - INFO - __main__ - Step 14848: {'lr': 0.000490761601800664, 'samples': 2850816, 'steps': 14847, 'loss/train': 1.7513176202774048}}} +11/06/2021 23:17:45 - INFO - __main__ - Step 14852: {'lr': 0.0004907558837539976, 'samples': 2851584, 'steps': 14851, 'loss/train': 1.7864621877670288}} +11/06/2021 23:17:45 - INFO - __main__ - Step 14852: {'lr': 0.0004907558837539976, 'samples': 2851584, 'steps': 14851, 'loss/train': 1.7864621877670288}} +11/06/2021 23:17:49 - INFO - __main__ - Step 14859: {'lr': 0.0004907458729958422, 'samples': 2852928, 'steps': 14858, 'loss/train': 1.4801957607269287}} +11/06/2021 23:17:51 - INFO - __main__ - Step 14864: {'lr': 0.0004907387191999984, 'samples': 2853888, 'steps': 14863, 'loss/train': 1.4284332990646362}} +11/06/2021 23:17:51 - INFO - __main__ - Step 14864: {'lr': 0.0004907387191999984, 'samples': 2853888, 'steps': 14863, 'loss/train': 1.4284332990646362}} +11/06/2021 23:17:56 - INFO - __main__ - Step 14872: {'lr': 0.0004907272674860779, 'samples': 2855424, 'steps': 14871, 'loss/train': 2.0826239585876465}} +11/06/2021 23:17:57 - INFO - __main__ - Step 14876: {'lr': 0.0004907215390258652, 'samples': 2856192, 'steps': 14875, 'loss/train': 1.654037356376648}}} +11/06/2021 23:17:59 - INFO - __main__ - Step 14880: {'lr': 0.0004907158088302059, 'samples': 2856960, 'steps': 14879, 'loss/train': 1.6989234685897827}} +11/06/2021 23:18:02 - INFO - __main__ - Step 14885: {'lr': 0.0004907086436452231, 'samples': 2857920, 'steps': 14884, 'loss/train': 1.5355026721954346}} +11/06/2021 23:18:04 - INFO - __main__ - Step 14889: {'lr': 0.0004907029095449602, 'samples': 2858688, 'steps': 14888, 'loss/train': 1.847086787223816}}} +11/06/2021 23:18:06 - INFO - __main__ - Step 14893: {'lr': 0.0004906971737093849, 'samples': 2859456, 'steps': 14892, 'loss/train': 1.9280325174331665}} +11/06/2021 23:18:08 - INFO - __main__ - Step 14897: {'lr': 0.0004906914361385387, 'samples': 2860224, 'steps': 14896, 'loss/train': 1.7625758647918701}} +11/06/2021 23:18:09 - INFO - __main__ - Step 14901: {'lr': 0.000490685696832463, 'samples': 2860992, 'steps': 14900, 'loss/train': 1.9356876611709595}}} +11/06/2021 23:18:11 - INFO - __main__ - Step 14905: {'lr': 0.0004906799557911992, 'samples': 2861760, 'steps': 14904, 'loss/train': 1.366396427154541}}} +11/06/2021 23:18:14 - INFO - __main__ - Step 14910: {'lr': 0.0004906727770495739, 'samples': 2862720, 'steps': 14909, 'loss/train': 1.645467758178711}}} +11/06/2021 23:18:14 - INFO - __main__ - Step 14910: {'lr': 0.0004906727770495739, 'samples': 2862720, 'steps': 14909, 'loss/train': 1.645467758178711}}} +11/06/2021 23:18:17 - INFO - __main__ - Step 14917: {'lr': 0.0004906627222566924, 'samples': 2864064, 'steps': 14916, 'loss/train': 1.4498852491378784}} +11/06/2021 23:18:19 - INFO - __main__ - Step 14921: {'lr': 0.0004906569742750899, 'samples': 2864832, 'steps': 14920, 'loss/train': 1.7183939218521118}} +11/06/2021 23:18:22 - INFO - __main__ - Step 14926: {'lr': 0.0004906497868582743, 'samples': 2865792, 'steps': 14925, 'loss/train': 1.4507989883422852}} +11/06/2021 23:18:24 - INFO - __main__ - Step 14930: {'lr': 0.0004906440349730226, 'samples': 2866560, 'steps': 14929, 'loss/train': 1.1155771017074585}} +11/06/2021 23:18:24 - INFO - __main__ - Step 14930: {'lr': 0.0004906440349730226, 'samples': 2866560, 'steps': 14929, 'loss/train': 1.1155771017074585}} +11/06/2021 23:18:28 - INFO - __main__ - Step 14938: {'lr': 0.000490632525997897, 'samples': 2868096, 'steps': 14937, 'loss/train': 1.6703389883041382}}} +11/06/2021 23:18:29 - INFO - __main__ - Step 14942: {'lr': 0.0004906267689081063, 'samples': 2868864, 'steps': 14941, 'loss/train': 1.9198617935180664}} +11/06/2021 23:18:31 - INFO - __main__ - Step 14946: {'lr': 0.0004906210100835522, 'samples': 2869632, 'steps': 14945, 'loss/train': 1.7185678482055664}} +11/06/2021 23:18:34 - INFO - __main__ - Step 14950: {'lr': 0.0004906152495242763, 'samples': 2870400, 'steps': 14949, 'loss/train': 1.3722232580184937}} +11/06/2021 23:18:36 - INFO - __main__ - Step 14954: {'lr': 0.00049060948723032, 'samples': 2871168, 'steps': 14953, 'loss/train': 1.7364459037780762}7}} +11/06/2021 23:18:38 - INFO - __main__ - Step 14958: {'lr': 0.000490603723201725, 'samples': 2871936, 'steps': 14957, 'loss/train': 3.7174441814422607}}} +11/06/2021 23:18:39 - INFO - __main__ - Step 14962: {'lr': 0.0004905979574385328, 'samples': 2872704, 'steps': 14961, 'loss/train': 1.4080133438110352}} +11/06/2021 23:18:42 - INFO - __main__ - Step 14967: {'lr': 0.0004905907477953286, 'samples': 2873664, 'steps': 14966, 'loss/train': 1.8428308963775635}} +11/06/2021 23:18:44 - INFO - __main__ - Step 14972: {'lr': 0.0004905835354419625, 'samples': 2874624, 'steps': 14971, 'loss/train': 1.7392559051513672}} +11/06/2021 23:18:44 - INFO - __main__ - Step 14972: {'lr': 0.0004905835354419625, 'samples': 2874624, 'steps': 14971, 'loss/train': 1.7392559051513672}} +11/06/2021 23:18:48 - INFO - __main__ - Step 14980: {'lr': 0.0004905719900396426, 'samples': 2876160, 'steps': 14979, 'loss/train': 1.410271406173706}}} +11/06/2021 23:18:50 - INFO - __main__ - Step 14984: {'lr': 0.0004905662147369091, 'samples': 2876928, 'steps': 14983, 'loss/train': 2.0281472206115723}} +11/06/2021 23:18:50 - INFO - __main__ - Step 14984: {'lr': 0.0004905662147369091, 'samples': 2876928, 'steps': 14983, 'loss/train': 2.0281472206115723}} +11/06/2021 23:18:50 - INFO - __main__ - Step 14984: {'lr': 0.0004905662147369091, 'samples': 2876928, 'steps': 14983, 'loss/train': 2.0281472206115723}} +11/06/2021 23:18:55 - INFO - __main__ - Step 14995: {'lr': 0.000490550323711895, 'samples': 2879040, 'steps': 14994, 'loss/train': 1.996849536895752}3}} +11/06/2021 23:18:57 - INFO - __main__ - Step 14999: {'lr': 0.000490544541905651, 'samples': 2879808, 'steps': 14998, 'loss/train': 1.6460684537887573}}} +11/06/2021 23:18:57 - INFO - __main__ - Step 14999: {'lr': 0.000490544541905651, 'samples': 2879808, 'steps': 14998, 'loss/train': 1.6460684537887573}}} +11/06/2021 23:18:57 - INFO - __main__ - Step 14999: {'lr': 0.000490544541905651, 'samples': 2879808, 'steps': 14998, 'loss/train': 1.6460684537887573}}} +11/06/2021 23:18:57 - INFO - __main__ - Step 14999: {'lr': 0.000490544541905651, 'samples': 2879808, 'steps': 14998, 'loss/train': 1.6460684537887573}}} +huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks... +To disable this warning, you can either: + - Avoid using `tokenizers` before the fork if possible + - Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false) +huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks... +To disable this warning, you can either: + - Avoid using `tokenizers` before the fork if possible + - Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false) +huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks... +To disable this warning, you can either: + - Avoid using `tokenizers` before the fork if possible + - Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false) +huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks... +To disable this warning, you can either: + - Avoid using `tokenizers` before the fork if possible